{
  "best_metric": 2.0353407859802246,
  "best_model_checkpoint": "output_main/wandb/run-20240211_075351-8o9ldy4a/files/train_output/checkpoint-10000",
  "epoch": 2.042133333333333,
  "eval_steps": 500,
  "global_step": 10000,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "MSE": 892.0916341145833,
      "MSE/layer0": 892.0916341145833,
      "dead_code_fraction": 0.15045,
      "dead_code_fraction/layer0": 0.15045,
      "epoch": 0.0,
      "input_norm": 31.997259775797524,
      "input_norm/layer0": 31.997259775797524,
      "learning_rate": 1e-05,
      "loss": 8.134,
      "max_norm": 35.01011657714844,
      "max_norm/layer0": 35.01011657714844,
      "mean_norm": 31.990370750427246,
      "mean_norm/layer0": 31.990370750427246,
      "multicode_k": 1,
      "output_norm": 8.571834087371826,
      "output_norm/layer0": 8.571834087371826,
      "step": 1
    },
    {
      "MSE": 889.7418754733337,
      "MSE/layer0": 889.7418754733337,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.01,
      "input_norm": 31.99632342656454,
      "input_norm/layer0": 31.99632342656454,
      "learning_rate": 0.0005,
      "loss": 7.1762,
      "max_norm": 35.03640365600586,
      "max_norm/layer0": 35.03640365600586,
      "mean_norm": 32.01236152648926,
      "mean_norm/layer0": 32.01236152648926,
      "multicode_k": 1,
      "output_norm": 8.591146861614817,
      "output_norm/layer0": 8.591146861614817,
      "step": 50
    },
    {
      "MSE": 869.5438468424481,
      "MSE/layer0": 869.5438468424481,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.01,
      "input_norm": 31.996115023295076,
      "input_norm/layer0": 31.996115023295076,
      "learning_rate": 0.001,
      "loss": 5.0118,
      "max_norm": 35.15137481689453,
      "max_norm/layer0": 35.15137481689453,
      "mean_norm": 32.11746788024902,
      "mean_norm/layer0": 32.11746788024902,
      "multicode_k": 1,
      "output_norm": 8.768607576688133,
      "output_norm/layer0": 8.768607576688133,
      "step": 100
    },
    {
      "MSE": 841.8395769246417,
      "MSE/layer0": 841.8395769246417,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.01,
      "input_norm": 31.996588408152256,
      "input_norm/layer0": 31.996588408152256,
      "learning_rate": 0.0015,
      "loss": 4.2338,
      "max_norm": 35.45364761352539,
      "max_norm/layer0": 35.45364761352539,
      "mean_norm": 32.34040641784668,
      "mean_norm/layer0": 32.34040641784668,
      "multicode_k": 1,
      "output_norm": 9.237536044120787,
      "output_norm/layer0": 9.237536044120787,
      "step": 150
    },
    {
      "MSE": 817.2703357950843,
      "MSE/layer0": 817.2703357950843,
      "dead_code_fraction": 5e-05,
      "dead_code_fraction/layer0": 5e-05,
      "epoch": 0.02,
      "input_norm": 31.99718633969625,
      "input_norm/layer0": 31.99718633969625,
      "learning_rate": 0.002,
      "loss": 3.837,
      "max_norm": 36.11206817626953,
      "max_norm/layer0": 36.11206817626953,
      "mean_norm": 32.652212142944336,
      "mean_norm/layer0": 32.652212142944336,
      "multicode_k": 1,
      "output_norm": 9.962018431027724,
      "output_norm/layer0": 9.962018431027724,
      "step": 200
    },
    {
      "MSE": 787.4571261596678,
      "MSE/layer0": 787.4571261596678,
      "dead_code_fraction": 0.0028,
      "dead_code_fraction/layer0": 0.0028,
      "epoch": 0.03,
      "input_norm": 31.99750740687052,
      "input_norm/layer0": 31.99750740687052,
      "learning_rate": 0.0025,
      "loss": 3.5507,
      "max_norm": 37.03396987915039,
      "max_norm/layer0": 37.03396987915039,
      "mean_norm": 33.030792236328125,
      "mean_norm/layer0": 33.030792236328125,
      "multicode_k": 1,
      "output_norm": 11.101801137924198,
      "output_norm/layer0": 11.101801137924198,
      "step": 250
    },
    {
      "MSE": 759.7653246053058,
      "MSE/layer0": 759.7653246053058,
      "dead_code_fraction": 0.02905,
      "dead_code_fraction/layer0": 0.02905,
      "epoch": 0.03,
      "input_norm": 31.99749964078267,
      "input_norm/layer0": 31.99749964078267,
      "learning_rate": 0.003,
      "loss": 3.3015,
      "max_norm": 37.927757263183594,
      "max_norm/layer0": 37.927757263183594,
      "mean_norm": 33.33859634399414,
      "mean_norm/layer0": 33.33859634399414,
      "multicode_k": 1,
      "output_norm": 12.222484871546431,
      "output_norm/layer0": 12.222484871546431,
      "step": 300
    },
    {
      "MSE": 734.5841912841795,
      "MSE/layer0": 734.5841912841795,
      "dead_code_fraction": 0.06455,
      "dead_code_fraction/layer0": 0.06455,
      "epoch": 0.04,
      "input_norm": 31.99746166547139,
      "input_norm/layer0": 31.99746166547139,
      "learning_rate": 0.0034999999999999996,
      "loss": 3.1483,
      "max_norm": 40.570350646972656,
      "max_norm/layer0": 40.570350646972656,
      "mean_norm": 33.79829216003418,
      "mean_norm/layer0": 33.79829216003418,
      "multicode_k": 1,
      "output_norm": 13.233797086079917,
      "output_norm/layer0": 13.233797086079917,
      "step": 350
    },
    {
      "MSE": 705.9179516601566,
      "MSE/layer0": 705.9179516601566,
      "dead_code_fraction": 0.13495,
      "dead_code_fraction/layer0": 0.13495,
      "epoch": 0.04,
      "input_norm": 31.997578941980994,
      "input_norm/layer0": 31.997578941980994,
      "learning_rate": 0.004,
      "loss": 3.0479,
      "max_norm": 45.86402130126953,
      "max_norm/layer0": 45.86402130126953,
      "mean_norm": 34.60604667663574,
      "mean_norm/layer0": 34.60604667663574,
      "multicode_k": 1,
      "output_norm": 14.794977650642394,
      "output_norm/layer0": 14.794977650642394,
      "step": 400
    },
    {
      "MSE": 673.0142825317382,
      "MSE/layer0": 673.0142825317382,
      "dead_code_fraction": 0.236,
      "dead_code_fraction/layer0": 0.236,
      "epoch": 0.04,
      "input_norm": 31.99772956212363,
      "input_norm/layer0": 31.99772956212363,
      "learning_rate": 0.0045000000000000005,
      "loss": 2.9234,
      "max_norm": 50.35022735595703,
      "max_norm/layer0": 50.35022735595703,
      "mean_norm": 35.50743293762207,
      "mean_norm/layer0": 35.50743293762207,
      "multicode_k": 1,
      "output_norm": 16.412540513674415,
      "output_norm/layer0": 16.412540513674415,
      "step": 450
    },
    {
      "MSE": 646.1952704874673,
      "MSE/layer0": 646.1952704874673,
      "dead_code_fraction": 0.31565,
      "dead_code_fraction/layer0": 0.31565,
      "epoch": 0.05,
      "input_norm": 31.997816743850702,
      "input_norm/layer0": 31.997816743850702,
      "learning_rate": 0.005,
      "loss": 2.8364,
      "max_norm": 55.06960678100586,
      "max_norm/layer0": 55.06960678100586,
      "mean_norm": 36.40013122558594,
      "mean_norm/layer0": 36.40013122558594,
      "multicode_k": 1,
      "output_norm": 17.61372879664104,
      "output_norm/layer0": 17.61372879664104,
      "step": 500
    },
    {
      "epoch": 0.05,
      "eval_MSE/layer0": 634.8931657946682,
      "eval_accuracy": 0.42267877747562077,
      "eval_dead_code_fraction/layer0": 0.3619,
      "eval_input_norm/layer0": 31.9978586178746,
      "eval_loss": 2.7649216651916504,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 18.081893277070293,
      "eval_runtime": 157.3558,
      "eval_samples_per_second": 29.379,
      "eval_steps_per_second": 1.837,
      "step": 500
    },
    {
      "MSE": 627.919213663737,
      "MSE/layer0": 627.919213663737,
      "dead_code_fraction": 0.35455,
      "dead_code_fraction/layer0": 0.35455,
      "epoch": 0.06,
      "input_norm": 31.997863556543983,
      "input_norm/layer0": 31.997863556543983,
      "learning_rate": 0.005,
      "loss": 2.6999,
      "max_norm": 59.44381332397461,
      "max_norm/layer0": 59.44381332397461,
      "mean_norm": 37.23677062988281,
      "mean_norm/layer0": 37.23677062988281,
      "multicode_k": 1,
      "output_norm": 18.411861616770416,
      "output_norm/layer0": 18.411861616770416,
      "step": 550
    },
    {
      "MSE": 613.3249330647789,
      "MSE/layer0": 613.3249330647789,
      "dead_code_fraction": 0.38215,
      "dead_code_fraction/layer0": 0.38215,
      "epoch": 0.06,
      "input_norm": 31.99789684613545,
      "input_norm/layer0": 31.99789684613545,
      "learning_rate": 0.005,
      "loss": 2.6511,
      "max_norm": 66.23004150390625,
      "max_norm/layer0": 66.23004150390625,
      "mean_norm": 38.00171661376953,
      "mean_norm/layer0": 38.00171661376953,
      "multicode_k": 1,
      "output_norm": 18.973640613555915,
      "output_norm/layer0": 18.973640613555915,
      "step": 600
    },
    {
      "MSE": 601.0688813273114,
      "MSE/layer0": 601.0688813273114,
      "dead_code_fraction": 0.3855,
      "dead_code_fraction/layer0": 0.3855,
      "epoch": 0.07,
      "input_norm": 31.997907568613698,
      "input_norm/layer0": 31.997907568613698,
      "learning_rate": 0.005,
      "loss": 2.5727,
      "max_norm": 72.61077117919922,
      "max_norm/layer0": 72.61077117919922,
      "mean_norm": 38.68782615661621,
      "mean_norm/layer0": 38.68782615661621,
      "multicode_k": 1,
      "output_norm": 19.389015719095863,
      "output_norm/layer0": 19.389015719095863,
      "step": 650
    },
    {
      "MSE": 595.7544806925458,
      "MSE/layer0": 595.7544806925458,
      "dead_code_fraction": 0.3847,
      "dead_code_fraction/layer0": 0.3847,
      "epoch": 0.07,
      "input_norm": 31.99792699813842,
      "input_norm/layer0": 31.99792699813842,
      "learning_rate": 0.005,
      "loss": 2.5303,
      "max_norm": 77.1572036743164,
      "max_norm/layer0": 77.1572036743164,
      "mean_norm": 39.301788330078125,
      "mean_norm/layer0": 39.301788330078125,
      "multicode_k": 1,
      "output_norm": 19.654865121841446,
      "output_norm/layer0": 19.654865121841446,
      "step": 700
    },
    {
      "MSE": 587.4001970418295,
      "MSE/layer0": 587.4001970418295,
      "dead_code_fraction": 0.38495,
      "dead_code_fraction/layer0": 0.38495,
      "epoch": 0.07,
      "input_norm": 31.997964229583737,
      "input_norm/layer0": 31.997964229583737,
      "learning_rate": 0.005,
      "loss": 2.5181,
      "max_norm": 81.00206756591797,
      "max_norm/layer0": 81.00206756591797,
      "mean_norm": 39.8663330078125,
      "mean_norm/layer0": 39.8663330078125,
      "multicode_k": 1,
      "output_norm": 19.91484704653422,
      "output_norm/layer0": 19.91484704653422,
      "step": 750
    },
    {
      "MSE": 582.8578649902345,
      "MSE/layer0": 582.8578649902345,
      "dead_code_fraction": 0.37595,
      "dead_code_fraction/layer0": 0.37595,
      "epoch": 0.08,
      "input_norm": 31.997961613337196,
      "input_norm/layer0": 31.997961613337196,
      "learning_rate": 0.005,
      "loss": 2.488,
      "max_norm": 84.8564682006836,
      "max_norm/layer0": 84.8564682006836,
      "mean_norm": 40.41610145568848,
      "mean_norm/layer0": 40.41610145568848,
      "multicode_k": 1,
      "output_norm": 20.113984060287464,
      "output_norm/layer0": 20.113984060287464,
      "step": 800
    },
    {
      "MSE": 578.7394322713219,
      "MSE/layer0": 578.7394322713219,
      "dead_code_fraction": 0.36775,
      "dead_code_fraction/layer0": 0.36775,
      "epoch": 0.09,
      "input_norm": 31.99793098767598,
      "input_norm/layer0": 31.99793098767598,
      "learning_rate": 0.005,
      "loss": 2.3972,
      "max_norm": 88.52584838867188,
      "max_norm/layer0": 88.52584838867188,
      "mean_norm": 40.93037033081055,
      "mean_norm/layer0": 40.93037033081055,
      "multicode_k": 1,
      "output_norm": 20.255761035283413,
      "output_norm/layer0": 20.255761035283413,
      "step": 850
    },
    {
      "MSE": 574.7943645222981,
      "MSE/layer0": 574.7943645222981,
      "dead_code_fraction": 0.3752,
      "dead_code_fraction/layer0": 0.3752,
      "epoch": 0.09,
      "input_norm": 31.99794203122458,
      "input_norm/layer0": 31.99794203122458,
      "learning_rate": 0.005,
      "loss": 2.4475,
      "max_norm": 91.37139129638672,
      "max_norm/layer0": 91.37139129638672,
      "mean_norm": 41.42861366271973,
      "mean_norm/layer0": 41.42861366271973,
      "multicode_k": 1,
      "output_norm": 20.38246509869893,
      "output_norm/layer0": 20.38246509869893,
      "step": 900
    },
    {
      "MSE": 572.0475691731768,
      "MSE/layer0": 572.0475691731768,
      "dead_code_fraction": 0.369,
      "dead_code_fraction/layer0": 0.369,
      "epoch": 0.1,
      "input_norm": 31.997947810490906,
      "input_norm/layer0": 31.997947810490906,
      "learning_rate": 0.005,
      "loss": 2.3928,
      "max_norm": 93.76451873779297,
      "max_norm/layer0": 93.76451873779297,
      "mean_norm": 41.89710807800293,
      "mean_norm/layer0": 41.89710807800293,
      "multicode_k": 1,
      "output_norm": 20.522438500722256,
      "output_norm/layer0": 20.522438500722256,
      "step": 950
    },
    {
      "MSE": 571.223816274007,
      "MSE/layer0": 571.223816274007,
      "dead_code_fraction": 0.35845,
      "dead_code_fraction/layer0": 0.35845,
      "epoch": 0.1,
      "input_norm": 31.997930752436314,
      "input_norm/layer0": 31.997930752436314,
      "learning_rate": 0.005,
      "loss": 2.3611,
      "max_norm": 95.86876678466797,
      "max_norm/layer0": 95.86876678466797,
      "mean_norm": 42.36003875732422,
      "mean_norm/layer0": 42.36003875732422,
      "multicode_k": 1,
      "output_norm": 20.59194125175477,
      "output_norm/layer0": 20.59194125175477,
      "step": 1000
    },
    {
      "epoch": 0.1,
      "eval_MSE/layer0": 568.7263942209383,
      "eval_accuracy": 0.47120194006380184,
      "eval_dead_code_fraction/layer0": 0.36065,
      "eval_input_norm/layer0": 31.997911268824648,
      "eval_loss": 2.370492935180664,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 20.66302644662364,
      "eval_runtime": 157.3974,
      "eval_samples_per_second": 29.372,
      "eval_steps_per_second": 1.836,
      "step": 1000
    },
    {
      "MSE": 568.216246948242,
      "MSE/layer0": 568.216246948242,
      "dead_code_fraction": 0.35655,
      "dead_code_fraction/layer0": 0.35655,
      "epoch": 0.1,
      "input_norm": 31.997933057149254,
      "input_norm/layer0": 31.997933057149254,
      "learning_rate": 0.005,
      "loss": 2.3877,
      "max_norm": 97.93981170654297,
      "max_norm/layer0": 97.93981170654297,
      "mean_norm": 42.796369552612305,
      "mean_norm/layer0": 42.796369552612305,
      "multicode_k": 1,
      "output_norm": 20.69294343630473,
      "output_norm/layer0": 20.69294343630473,
      "step": 1050
    },
    {
      "MSE": 566.0765097045902,
      "MSE/layer0": 566.0765097045902,
      "dead_code_fraction": 0.3515,
      "dead_code_fraction/layer0": 0.3515,
      "epoch": 0.11,
      "input_norm": 31.997944701512658,
      "input_norm/layer0": 31.997944701512658,
      "learning_rate": 0.005,
      "loss": 2.32,
      "max_norm": 99.40829467773438,
      "max_norm/layer0": 99.40829467773438,
      "mean_norm": 43.20481872558594,
      "mean_norm/layer0": 43.20481872558594,
      "multicode_k": 1,
      "output_norm": 20.780460087458298,
      "output_norm/layer0": 20.780460087458298,
      "step": 1100
    },
    {
      "MSE": 563.1435256449383,
      "MSE/layer0": 563.1435256449383,
      "dead_code_fraction": 0.3425,
      "dead_code_fraction/layer0": 0.3425,
      "epoch": 0.12,
      "input_norm": 31.99793601353964,
      "input_norm/layer0": 31.99793601353964,
      "learning_rate": 0.005,
      "loss": 2.3309,
      "max_norm": 100.84235382080078,
      "max_norm/layer0": 100.84235382080078,
      "mean_norm": 43.63128852844238,
      "mean_norm/layer0": 43.63128852844238,
      "multicode_k": 1,
      "output_norm": 20.85479287147521,
      "output_norm/layer0": 20.85479287147521,
      "step": 1150
    },
    {
      "MSE": 561.2093427530926,
      "MSE/layer0": 561.2093427530926,
      "dead_code_fraction": 0.3403,
      "dead_code_fraction/layer0": 0.3403,
      "epoch": 0.12,
      "input_norm": 31.99792865435282,
      "input_norm/layer0": 31.99792865435282,
      "learning_rate": 0.005,
      "loss": 2.3308,
      "max_norm": 102.74110412597656,
      "max_norm/layer0": 102.74110412597656,
      "mean_norm": 44.03978157043457,
      "mean_norm/layer0": 44.03978157043457,
      "multicode_k": 1,
      "output_norm": 20.931864147186282,
      "output_norm/layer0": 20.931864147186282,
      "step": 1200
    },
    {
      "MSE": 559.3785518391925,
      "MSE/layer0": 559.3785518391925,
      "dead_code_fraction": 0.3412,
      "dead_code_fraction/layer0": 0.3412,
      "epoch": 0.12,
      "input_norm": 31.99792771339417,
      "input_norm/layer0": 31.99792771339417,
      "learning_rate": 0.005,
      "loss": 2.3437,
      "max_norm": 104.6494369506836,
      "max_norm/layer0": 104.6494369506836,
      "mean_norm": 44.438026428222656,
      "mean_norm/layer0": 44.438026428222656,
      "multicode_k": 1,
      "output_norm": 21.008427244822187,
      "output_norm/layer0": 21.008427244822187,
      "step": 1250
    },
    {
      "MSE": 557.9434753417968,
      "MSE/layer0": 557.9434753417968,
      "dead_code_fraction": 0.33015,
      "dead_code_fraction/layer0": 0.33015,
      "epoch": 0.13,
      "input_norm": 31.997915770212824,
      "input_norm/layer0": 31.997915770212824,
      "learning_rate": 0.005,
      "loss": 2.2785,
      "max_norm": 106.27558135986328,
      "max_norm/layer0": 106.27558135986328,
      "mean_norm": 44.82562255859375,
      "mean_norm/layer0": 44.82562255859375,
      "multicode_k": 1,
      "output_norm": 21.07806761741638,
      "output_norm/layer0": 21.07806761741638,
      "step": 1300
    },
    {
      "MSE": 556.1554424031574,
      "MSE/layer0": 556.1554424031574,
      "dead_code_fraction": 0.3277,
      "dead_code_fraction/layer0": 0.3277,
      "epoch": 0.14,
      "input_norm": 31.9979051399231,
      "input_norm/layer0": 31.9979051399231,
      "learning_rate": 0.005,
      "loss": 2.2823,
      "max_norm": 107.8658676147461,
      "max_norm/layer0": 107.8658676147461,
      "mean_norm": 45.21988105773926,
      "mean_norm/layer0": 45.21988105773926,
      "multicode_k": 1,
      "output_norm": 21.124666048685715,
      "output_norm/layer0": 21.124666048685715,
      "step": 1350
    },
    {
      "MSE": 554.1472004191082,
      "MSE/layer0": 554.1472004191082,
      "dead_code_fraction": 0.32535,
      "dead_code_fraction/layer0": 0.32535,
      "epoch": 0.14,
      "input_norm": 31.99791674613953,
      "input_norm/layer0": 31.99791674613953,
      "learning_rate": 0.005,
      "loss": 2.3034,
      "max_norm": 109.18831634521484,
      "max_norm/layer0": 109.18831634521484,
      "mean_norm": 45.60391616821289,
      "mean_norm/layer0": 45.60391616821289,
      "multicode_k": 1,
      "output_norm": 21.184103918075557,
      "output_norm/layer0": 21.184103918075557,
      "step": 1400
    },
    {
      "MSE": 553.0813423156735,
      "MSE/layer0": 553.0813423156735,
      "dead_code_fraction": 0.3218,
      "dead_code_fraction/layer0": 0.3218,
      "epoch": 0.14,
      "input_norm": 31.997899109522507,
      "input_norm/layer0": 31.997899109522507,
      "learning_rate": 0.005,
      "loss": 2.2583,
      "max_norm": 110.68695831298828,
      "max_norm/layer0": 110.68695831298828,
      "mean_norm": 45.98097801208496,
      "mean_norm/layer0": 45.98097801208496,
      "multicode_k": 1,
      "output_norm": 21.234303328196226,
      "output_norm/layer0": 21.234303328196226,
      "step": 1450
    },
    {
      "MSE": 551.1942003377276,
      "MSE/layer0": 551.1942003377276,
      "dead_code_fraction": 0.32175,
      "dead_code_fraction/layer0": 0.32175,
      "epoch": 0.15,
      "input_norm": 31.997910699844365,
      "input_norm/layer0": 31.997910699844365,
      "learning_rate": 0.005,
      "loss": 2.2395,
      "max_norm": 112.16923522949219,
      "max_norm/layer0": 112.16923522949219,
      "mean_norm": 46.355411529541016,
      "mean_norm/layer0": 46.355411529541016,
      "multicode_k": 1,
      "output_norm": 21.303704795837398,
      "output_norm/layer0": 21.303704795837398,
      "step": 1500
    },
    {
      "epoch": 0.15,
      "eval_MSE/layer0": 550.3311246673497,
      "eval_accuracy": 0.486590169556823,
      "eval_dead_code_fraction/layer0": 0.32665,
      "eval_input_norm/layer0": 31.99789719372221,
      "eval_loss": 2.253082513809204,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 21.329729693291277,
      "eval_runtime": 160.4576,
      "eval_samples_per_second": 28.811,
      "eval_steps_per_second": 1.801,
      "step": 1500
    },
    {
      "MSE": 551.4163179524738,
      "MSE/layer0": 551.4163179524738,
      "dead_code_fraction": 0.3174,
      "dead_code_fraction/layer0": 0.3174,
      "epoch": 0.15,
      "input_norm": 31.997892700831095,
      "input_norm/layer0": 31.997892700831095,
      "learning_rate": 0.005,
      "loss": 2.1968,
      "max_norm": 113.21269989013672,
      "max_norm/layer0": 113.21269989013672,
      "mean_norm": 46.7271785736084,
      "mean_norm/layer0": 46.7271785736084,
      "multicode_k": 1,
      "output_norm": 21.321544698079432,
      "output_norm/layer0": 21.321544698079432,
      "step": 1550
    },
    {
      "MSE": 549.0553175354001,
      "MSE/layer0": 549.0553175354001,
      "dead_code_fraction": 0.31715,
      "dead_code_fraction/layer0": 0.31715,
      "epoch": 0.16,
      "input_norm": 31.99791664441427,
      "input_norm/layer0": 31.99791664441427,
      "learning_rate": 0.005,
      "loss": 2.2863,
      "max_norm": 114.45362854003906,
      "max_norm/layer0": 114.45362854003906,
      "mean_norm": 47.08230972290039,
      "mean_norm/layer0": 47.08230972290039,
      "multicode_k": 1,
      "output_norm": 21.38125430742899,
      "output_norm/layer0": 21.38125430742899,
      "step": 1600
    },
    {
      "MSE": 547.4109810384114,
      "MSE/layer0": 547.4109810384114,
      "dead_code_fraction": 0.3131,
      "dead_code_fraction/layer0": 0.3131,
      "epoch": 0.17,
      "input_norm": 31.997924680709843,
      "input_norm/layer0": 31.997924680709843,
      "learning_rate": 0.005,
      "loss": 2.2147,
      "max_norm": 115.29362487792969,
      "max_norm/layer0": 115.29362487792969,
      "mean_norm": 47.438798904418945,
      "mean_norm/layer0": 47.438798904418945,
      "multicode_k": 1,
      "output_norm": 21.454637037913013,
      "output_norm/layer0": 21.454637037913013,
      "step": 1650
    },
    {
      "MSE": 546.0445864868163,
      "MSE/layer0": 546.0445864868163,
      "dead_code_fraction": 0.31475,
      "dead_code_fraction/layer0": 0.31475,
      "epoch": 0.17,
      "input_norm": 31.997929503122954,
      "input_norm/layer0": 31.997929503122954,
      "learning_rate": 0.005,
      "loss": 2.2501,
      "max_norm": 116.09871673583984,
      "max_norm/layer0": 116.09871673583984,
      "mean_norm": 47.79398536682129,
      "mean_norm/layer0": 47.79398536682129,
      "multicode_k": 1,
      "output_norm": 21.4808695602417,
      "output_norm/layer0": 21.4808695602417,
      "step": 1700
    },
    {
      "MSE": 545.4600128173831,
      "MSE/layer0": 545.4600128173831,
      "dead_code_fraction": 0.30905,
      "dead_code_fraction/layer0": 0.30905,
      "epoch": 0.17,
      "input_norm": 31.997937501271572,
      "input_norm/layer0": 31.997937501271572,
      "learning_rate": 0.005,
      "loss": 2.2296,
      "max_norm": 117.0920181274414,
      "max_norm/layer0": 117.0920181274414,
      "mean_norm": 48.138267517089844,
      "mean_norm/layer0": 48.138267517089844,
      "multicode_k": 1,
      "output_norm": 21.52623297691346,
      "output_norm/layer0": 21.52623297691346,
      "step": 1750
    },
    {
      "MSE": 543.9589634704591,
      "MSE/layer0": 543.9589634704591,
      "dead_code_fraction": 0.3074,
      "dead_code_fraction/layer0": 0.3074,
      "epoch": 0.18,
      "input_norm": 31.997916940053315,
      "input_norm/layer0": 31.997916940053315,
      "learning_rate": 0.005,
      "loss": 2.1632,
      "max_norm": 118.44883728027344,
      "max_norm/layer0": 118.44883728027344,
      "mean_norm": 48.48598670959473,
      "mean_norm/layer0": 48.48598670959473,
      "multicode_k": 1,
      "output_norm": 21.572722558975222,
      "output_norm/layer0": 21.572722558975222,
      "step": 1800
    },
    {
      "MSE": 543.3154680887858,
      "MSE/layer0": 543.3154680887858,
      "dead_code_fraction": 0.30485,
      "dead_code_fraction/layer0": 0.30485,
      "epoch": 0.18,
      "input_norm": 31.997930173873904,
      "input_norm/layer0": 31.997930173873904,
      "learning_rate": 0.005,
      "loss": 2.1874,
      "max_norm": 119.3927001953125,
      "max_norm/layer0": 119.3927001953125,
      "mean_norm": 48.82695388793945,
      "mean_norm/layer0": 48.82695388793945,
      "multicode_k": 1,
      "output_norm": 21.595847959518437,
      "output_norm/layer0": 21.595847959518437,
      "step": 1850
    },
    {
      "MSE": 542.2137928263345,
      "MSE/layer0": 542.2137928263345,
      "dead_code_fraction": 0.30715,
      "dead_code_fraction/layer0": 0.30715,
      "epoch": 0.19,
      "input_norm": 31.997955802281705,
      "input_norm/layer0": 31.997955802281705,
      "learning_rate": 0.005,
      "loss": 2.2323,
      "max_norm": 121.5817642211914,
      "max_norm/layer0": 121.5817642211914,
      "mean_norm": 49.15649604797363,
      "mean_norm/layer0": 49.15649604797363,
      "multicode_k": 1,
      "output_norm": 21.63884919484457,
      "output_norm/layer0": 21.63884919484457,
      "step": 1900
    },
    {
      "MSE": 539.4505286661786,
      "MSE/layer0": 539.4505286661786,
      "dead_code_fraction": 0.3033,
      "dead_code_fraction/layer0": 0.3033,
      "epoch": 0.2,
      "input_norm": 31.997942549387595,
      "input_norm/layer0": 31.997942549387595,
      "learning_rate": 0.005,
      "loss": 2.1894,
      "max_norm": 123.63184356689453,
      "max_norm/layer0": 123.63184356689453,
      "mean_norm": 49.49074363708496,
      "mean_norm/layer0": 49.49074363708496,
      "multicode_k": 1,
      "output_norm": 21.689245723088575,
      "output_norm/layer0": 21.689245723088575,
      "step": 1950
    },
    {
      "MSE": 539.8872321573892,
      "MSE/layer0": 539.8872321573892,
      "dead_code_fraction": 0.29975,
      "dead_code_fraction/layer0": 0.29975,
      "epoch": 0.2,
      "input_norm": 31.997952289581303,
      "input_norm/layer0": 31.997952289581303,
      "learning_rate": 0.005,
      "loss": 2.1999,
      "max_norm": 125.97776794433594,
      "max_norm/layer0": 125.97776794433594,
      "mean_norm": 49.814876556396484,
      "mean_norm/layer0": 49.814876556396484,
      "multicode_k": 1,
      "output_norm": 21.72016517957053,
      "output_norm/layer0": 21.72016517957053,
      "step": 2000
    },
    {
      "epoch": 0.2,
      "eval_MSE/layer0": 539.0149815035619,
      "eval_accuracy": 0.4955417565578542,
      "eval_dead_code_fraction/layer0": 0.30475,
      "eval_input_norm/layer0": 31.997959356660743,
      "eval_loss": 2.1908392906188965,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 21.766283075917258,
      "eval_runtime": 158.005,
      "eval_samples_per_second": 29.259,
      "eval_steps_per_second": 1.829,
      "step": 2000
    },
    {
      "MSE": 538.042401936849,
      "MSE/layer0": 538.042401936849,
      "dead_code_fraction": 0.30175,
      "dead_code_fraction/layer0": 0.30175,
      "epoch": 0.2,
      "input_norm": 31.99795293172201,
      "input_norm/layer0": 31.99795293172201,
      "learning_rate": 0.005,
      "loss": 2.1768,
      "max_norm": 127.91316986083984,
      "max_norm/layer0": 127.91316986083984,
      "mean_norm": 50.13774490356445,
      "mean_norm/layer0": 50.13774490356445,
      "multicode_k": 1,
      "output_norm": 21.768677377700797,
      "output_norm/layer0": 21.768677377700797,
      "step": 2050
    },
    {
      "MSE": 537.4139138285318,
      "MSE/layer0": 537.4139138285318,
      "dead_code_fraction": 0.29605,
      "dead_code_fraction/layer0": 0.29605,
      "epoch": 0.21,
      "input_norm": 31.997954098383584,
      "input_norm/layer0": 31.997954098383584,
      "learning_rate": 0.005,
      "loss": 2.1417,
      "max_norm": 129.62669372558594,
      "max_norm/layer0": 129.62669372558594,
      "mean_norm": 50.44980430603027,
      "mean_norm/layer0": 50.44980430603027,
      "multicode_k": 1,
      "output_norm": 21.780523262023927,
      "output_norm/layer0": 21.780523262023927,
      "step": 2100
    },
    {
      "MSE": 537.116479644775,
      "MSE/layer0": 537.116479644775,
      "dead_code_fraction": 0.298,
      "dead_code_fraction/layer0": 0.298,
      "epoch": 0.21,
      "input_norm": 31.99796335220337,
      "input_norm/layer0": 31.99796335220337,
      "learning_rate": 0.005,
      "loss": 2.1753,
      "max_norm": 131.71987915039062,
      "max_norm/layer0": 131.71987915039062,
      "mean_norm": 50.758169174194336,
      "mean_norm/layer0": 50.758169174194336,
      "multicode_k": 1,
      "output_norm": 21.819064016342168,
      "output_norm/layer0": 21.819064016342168,
      "step": 2150
    },
    {
      "MSE": 536.1095620218915,
      "MSE/layer0": 536.1095620218915,
      "dead_code_fraction": 0.29655,
      "dead_code_fraction/layer0": 0.29655,
      "epoch": 0.22,
      "input_norm": 31.997976016998287,
      "input_norm/layer0": 31.997976016998287,
      "learning_rate": 0.005,
      "loss": 2.1676,
      "max_norm": 133.67694091796875,
      "max_norm/layer0": 133.67694091796875,
      "mean_norm": 51.058135986328125,
      "mean_norm/layer0": 51.058135986328125,
      "multicode_k": 1,
      "output_norm": 21.83967799504598,
      "output_norm/layer0": 21.83967799504598,
      "step": 2200
    },
    {
      "MSE": 535.5964339701336,
      "MSE/layer0": 535.5964339701336,
      "dead_code_fraction": 0.2945,
      "dead_code_fraction/layer0": 0.2945,
      "epoch": 0.23,
      "input_norm": 31.997973279952987,
      "input_norm/layer0": 31.997973279952987,
      "learning_rate": 0.005,
      "loss": 2.1347,
      "max_norm": 135.40386962890625,
      "max_norm/layer0": 135.40386962890625,
      "mean_norm": 51.35656929016113,
      "mean_norm/layer0": 51.35656929016113,
      "multicode_k": 1,
      "output_norm": 21.857111148834242,
      "output_norm/layer0": 21.857111148834242,
      "step": 2250
    },
    {
      "MSE": 534.8214352925618,
      "MSE/layer0": 534.8214352925618,
      "dead_code_fraction": 0.2943,
      "dead_code_fraction/layer0": 0.2943,
      "epoch": 0.23,
      "input_norm": 31.99798300425212,
      "input_norm/layer0": 31.99798300425212,
      "learning_rate": 0.005,
      "loss": 2.1712,
      "max_norm": 137.13648986816406,
      "max_norm/layer0": 137.13648986816406,
      "mean_norm": 51.64659118652344,
      "mean_norm/layer0": 51.64659118652344,
      "multicode_k": 1,
      "output_norm": 21.901708291371662,
      "output_norm/layer0": 21.901708291371662,
      "step": 2300
    },
    {
      "MSE": 533.4100613403319,
      "MSE/layer0": 533.4100613403319,
      "dead_code_fraction": 0.29105,
      "dead_code_fraction/layer0": 0.29105,
      "epoch": 0.23,
      "input_norm": 31.99798559824626,
      "input_norm/layer0": 31.99798559824626,
      "learning_rate": 0.005,
      "loss": 2.1726,
      "max_norm": 138.62417602539062,
      "max_norm/layer0": 138.62417602539062,
      "mean_norm": 51.931190490722656,
      "mean_norm/layer0": 51.931190490722656,
      "multicode_k": 1,
      "output_norm": 21.91944276809694,
      "output_norm/layer0": 21.91944276809694,
      "step": 2350
    },
    {
      "MSE": 533.0944277445471,
      "MSE/layer0": 533.0944277445471,
      "dead_code_fraction": 0.29235,
      "dead_code_fraction/layer0": 0.29235,
      "epoch": 0.24,
      "input_norm": 31.99797873497009,
      "input_norm/layer0": 31.99797873497009,
      "learning_rate": 0.005,
      "loss": 2.1496,
      "max_norm": 140.219970703125,
      "max_norm/layer0": 140.219970703125,
      "mean_norm": 52.213850021362305,
      "mean_norm/layer0": 52.213850021362305,
      "multicode_k": 1,
      "output_norm": 21.941968046824137,
      "output_norm/layer0": 21.941968046824137,
      "step": 2400
    },
    {
      "MSE": 531.4289741007487,
      "MSE/layer0": 531.4289741007487,
      "dead_code_fraction": 0.29335,
      "dead_code_fraction/layer0": 0.29335,
      "epoch": 0.24,
      "input_norm": 31.998000961939493,
      "input_norm/layer0": 31.998000961939493,
      "learning_rate": 0.005,
      "loss": 2.153,
      "max_norm": 141.84396362304688,
      "max_norm/layer0": 141.84396362304688,
      "mean_norm": 52.47932052612305,
      "mean_norm/layer0": 52.47932052612305,
      "multicode_k": 1,
      "output_norm": 21.982840156555177,
      "output_norm/layer0": 21.982840156555177,
      "step": 2450
    },
    {
      "MSE": 531.2627974446617,
      "MSE/layer0": 531.2627974446617,
      "dead_code_fraction": 0.28885,
      "dead_code_fraction/layer0": 0.28885,
      "epoch": 0.25,
      "input_norm": 31.99799962997436,
      "input_norm/layer0": 31.99799962997436,
      "learning_rate": 0.005,
      "loss": 2.1688,
      "max_norm": 143.0140838623047,
      "max_norm/layer0": 143.0140838623047,
      "mean_norm": 52.74382019042969,
      "mean_norm/layer0": 52.74382019042969,
      "multicode_k": 1,
      "output_norm": 22.00004559199015,
      "output_norm/layer0": 22.00004559199015,
      "step": 2500
    },
    {
      "epoch": 0.25,
      "eval_MSE/layer0": 530.4651256365718,
      "eval_accuracy": 0.5006363482007701,
      "eval_dead_code_fraction/layer0": 0.29495,
      "eval_input_norm/layer0": 31.99800563596064,
      "eval_loss": 2.155103921890259,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 22.022818533393835,
      "eval_runtime": 157.5009,
      "eval_samples_per_second": 29.352,
      "eval_steps_per_second": 1.835,
      "step": 2500
    },
    {
      "MSE": 530.4989952596026,
      "MSE/layer0": 530.4989952596026,
      "dead_code_fraction": 0.29025,
      "dead_code_fraction/layer0": 0.29025,
      "epoch": 0.26,
      "input_norm": 31.99801852544149,
      "input_norm/layer0": 31.99801852544149,
      "learning_rate": 0.005,
      "loss": 2.1541,
      "max_norm": 144.50558471679688,
      "max_norm/layer0": 144.50558471679688,
      "mean_norm": 52.992868423461914,
      "mean_norm/layer0": 52.992868423461914,
      "multicode_k": 1,
      "output_norm": 22.044915301005062,
      "output_norm/layer0": 22.044915301005062,
      "step": 2550
    },
    {
      "MSE": 529.2955647786457,
      "MSE/layer0": 529.2955647786457,
      "dead_code_fraction": 0.288,
      "dead_code_fraction/layer0": 0.288,
      "epoch": 0.26,
      "input_norm": 31.998021106719975,
      "input_norm/layer0": 31.998021106719975,
      "learning_rate": 0.005,
      "loss": 2.1563,
      "max_norm": 146.2478485107422,
      "max_norm/layer0": 146.2478485107422,
      "mean_norm": 53.24601364135742,
      "mean_norm/layer0": 53.24601364135742,
      "multicode_k": 1,
      "output_norm": 22.048689235051476,
      "output_norm/layer0": 22.048689235051476,
      "step": 2600
    },
    {
      "MSE": 529.877343190511,
      "MSE/layer0": 529.877343190511,
      "dead_code_fraction": 0.288,
      "dead_code_fraction/layer0": 0.288,
      "epoch": 0.27,
      "input_norm": 31.998024587631217,
      "input_norm/layer0": 31.998024587631217,
      "learning_rate": 0.005,
      "loss": 2.1382,
      "max_norm": 147.41587829589844,
      "max_norm/layer0": 147.41587829589844,
      "mean_norm": 53.48561096191406,
      "mean_norm/layer0": 53.48561096191406,
      "multicode_k": 1,
      "output_norm": 22.0797532526652,
      "output_norm/layer0": 22.0797532526652,
      "step": 2650
    },
    {
      "MSE": 528.3514750671387,
      "MSE/layer0": 528.3514750671387,
      "dead_code_fraction": 0.28825,
      "dead_code_fraction/layer0": 0.28825,
      "epoch": 0.27,
      "input_norm": 31.99804752349852,
      "input_norm/layer0": 31.99804752349852,
      "learning_rate": 0.005,
      "loss": 2.1742,
      "max_norm": 148.7862091064453,
      "max_norm/layer0": 148.7862091064453,
      "mean_norm": 53.71611213684082,
      "mean_norm/layer0": 53.71611213684082,
      "multicode_k": 1,
      "output_norm": 22.09869578997295,
      "output_norm/layer0": 22.09869578997295,
      "step": 2700
    },
    {
      "MSE": 528.2884072875979,
      "MSE/layer0": 528.2884072875979,
      "dead_code_fraction": 0.28335,
      "dead_code_fraction/layer0": 0.28335,
      "epoch": 0.28,
      "input_norm": 31.998042856852216,
      "input_norm/layer0": 31.998042856852216,
      "learning_rate": 0.005,
      "loss": 2.1277,
      "max_norm": 150.35140991210938,
      "max_norm/layer0": 150.35140991210938,
      "mean_norm": 53.946285247802734,
      "mean_norm/layer0": 53.946285247802734,
      "multicode_k": 1,
      "output_norm": 22.106029316584255,
      "output_norm/layer0": 22.106029316584255,
      "step": 2750
    },
    {
      "MSE": 527.2996965026854,
      "MSE/layer0": 527.2996965026854,
      "dead_code_fraction": 0.2844,
      "dead_code_fraction/layer0": 0.2844,
      "epoch": 0.28,
      "input_norm": 31.9980613454183,
      "input_norm/layer0": 31.9980613454183,
      "learning_rate": 0.005,
      "loss": 2.1676,
      "max_norm": 152.27590942382812,
      "max_norm/layer0": 152.27590942382812,
      "mean_norm": 54.16430473327637,
      "mean_norm/layer0": 54.16430473327637,
      "multicode_k": 1,
      "output_norm": 22.141783040364587,
      "output_norm/layer0": 22.141783040364587,
      "step": 2800
    },
    {
      "MSE": 527.5191156514486,
      "MSE/layer0": 527.5191156514486,
      "dead_code_fraction": 0.28045,
      "dead_code_fraction/layer0": 0.28045,
      "epoch": 0.28,
      "input_norm": 31.998067801793418,
      "input_norm/layer0": 31.998067801793418,
      "learning_rate": 0.005,
      "loss": 2.1076,
      "max_norm": 153.54779052734375,
      "max_norm/layer0": 153.54779052734375,
      "mean_norm": 54.38737678527832,
      "mean_norm/layer0": 54.38737678527832,
      "multicode_k": 1,
      "output_norm": 22.13956375757853,
      "output_norm/layer0": 22.13956375757853,
      "step": 2850
    },
    {
      "MSE": 527.3752633666991,
      "MSE/layer0": 527.3752633666991,
      "dead_code_fraction": 0.28165,
      "dead_code_fraction/layer0": 0.28165,
      "epoch": 0.29,
      "input_norm": 31.998070557912186,
      "input_norm/layer0": 31.998070557912186,
      "learning_rate": 0.005,
      "loss": 2.1379,
      "max_norm": 155.25857543945312,
      "max_norm/layer0": 155.25857543945312,
      "mean_norm": 54.598867416381836,
      "mean_norm/layer0": 54.598867416381836,
      "multicode_k": 1,
      "output_norm": 22.1554997475942,
      "output_norm/layer0": 22.1554997475942,
      "step": 2900
    },
    {
      "MSE": 525.2142114257812,
      "MSE/layer0": 525.2142114257812,
      "dead_code_fraction": 0.2841,
      "dead_code_fraction/layer0": 0.2841,
      "epoch": 0.29,
      "input_norm": 31.998104591369632,
      "input_norm/layer0": 31.998104591369632,
      "learning_rate": 0.005,
      "loss": 2.1887,
      "max_norm": 157.656494140625,
      "max_norm/layer0": 157.656494140625,
      "mean_norm": 54.80296516418457,
      "mean_norm/layer0": 54.80296516418457,
      "multicode_k": 1,
      "output_norm": 22.194608500798537,
      "output_norm/layer0": 22.194608500798537,
      "step": 2950
    },
    {
      "MSE": 525.7639581807456,
      "MSE/layer0": 525.7639581807456,
      "dead_code_fraction": 0.28035,
      "dead_code_fraction/layer0": 0.28035,
      "epoch": 0.3,
      "input_norm": 31.998085311253874,
      "input_norm/layer0": 31.998085311253874,
      "learning_rate": 0.005,
      "loss": 2.1108,
      "max_norm": 159.0706787109375,
      "max_norm/layer0": 159.0706787109375,
      "mean_norm": 55.01374816894531,
      "mean_norm/layer0": 55.01374816894531,
      "multicode_k": 1,
      "output_norm": 22.19143549601236,
      "output_norm/layer0": 22.19143549601236,
      "step": 3000
    },
    {
      "epoch": 0.3,
      "eval_MSE/layer0": 524.9529532255765,
      "eval_accuracy": 0.5051228197488481,
      "eval_dead_code_fraction/layer0": 0.2809,
      "eval_input_norm/layer0": 31.998092802783354,
      "eval_loss": 2.126948595046997,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 22.207113418645122,
      "eval_runtime": 157.5523,
      "eval_samples_per_second": 29.343,
      "eval_steps_per_second": 1.834,
      "step": 3000
    },
    {
      "MSE": 525.49979405721,
      "MSE/layer0": 525.49979405721,
      "dead_code_fraction": 0.28015,
      "dead_code_fraction/layer0": 0.28015,
      "epoch": 0.3,
      "input_norm": 31.998098812103272,
      "input_norm/layer0": 31.998098812103272,
      "learning_rate": 0.005,
      "loss": 2.1814,
      "max_norm": 160.52183532714844,
      "max_norm/layer0": 160.52183532714844,
      "mean_norm": 55.21175575256348,
      "mean_norm/layer0": 55.21175575256348,
      "multicode_k": 1,
      "output_norm": 22.205291633605963,
      "output_norm/layer0": 22.205291633605963,
      "step": 3050
    },
    {
      "MSE": 525.1535092671712,
      "MSE/layer0": 525.1535092671712,
      "dead_code_fraction": 0.27915,
      "dead_code_fraction/layer0": 0.27915,
      "epoch": 0.31,
      "input_norm": 31.998094654083246,
      "input_norm/layer0": 31.998094654083246,
      "learning_rate": 0.005,
      "loss": 2.1228,
      "max_norm": 161.857666015625,
      "max_norm/layer0": 161.857666015625,
      "mean_norm": 55.42117881774902,
      "mean_norm/layer0": 55.42117881774902,
      "multicode_k": 1,
      "output_norm": 22.20783314704896,
      "output_norm/layer0": 22.20783314704896,
      "step": 3100
    },
    {
      "MSE": 524.7367662556965,
      "MSE/layer0": 524.7367662556965,
      "dead_code_fraction": 0.27865,
      "dead_code_fraction/layer0": 0.27865,
      "epoch": 0.32,
      "input_norm": 31.99810951550802,
      "input_norm/layer0": 31.99810951550802,
      "learning_rate": 0.005,
      "loss": 2.1582,
      "max_norm": 163.2421417236328,
      "max_norm/layer0": 163.2421417236328,
      "mean_norm": 55.61536979675293,
      "mean_norm/layer0": 55.61536979675293,
      "multicode_k": 1,
      "output_norm": 22.229626963933313,
      "output_norm/layer0": 22.229626963933313,
      "step": 3150
    },
    {
      "MSE": 523.2996738688151,
      "MSE/layer0": 523.2996738688151,
      "dead_code_fraction": 0.27935,
      "dead_code_fraction/layer0": 0.27935,
      "epoch": 0.32,
      "input_norm": 31.998107938766474,
      "input_norm/layer0": 31.998107938766474,
      "learning_rate": 0.005,
      "loss": 2.0913,
      "max_norm": 164.34832763671875,
      "max_norm/layer0": 164.34832763671875,
      "mean_norm": 55.82136154174805,
      "mean_norm/layer0": 55.82136154174805,
      "multicode_k": 1,
      "output_norm": 22.247861604690552,
      "output_norm/layer0": 22.247861604690552,
      "step": 3200
    },
    {
      "MSE": 524.0594484965007,
      "MSE/layer0": 524.0594484965007,
      "dead_code_fraction": 0.2756,
      "dead_code_fraction/layer0": 0.2756,
      "epoch": 0.33,
      "input_norm": 31.998120482762648,
      "input_norm/layer0": 31.998120482762648,
      "learning_rate": 0.005,
      "loss": 2.1073,
      "max_norm": 165.75938415527344,
      "max_norm/layer0": 165.75938415527344,
      "mean_norm": 56.010887145996094,
      "mean_norm/layer0": 56.010887145996094,
      "multicode_k": 1,
      "output_norm": 22.245831327438353,
      "output_norm/layer0": 22.245831327438353,
      "step": 3250
    },
    {
      "MSE": 525.364818725586,
      "MSE/layer0": 525.364818725586,
      "dead_code_fraction": 0.2756,
      "dead_code_fraction/layer0": 0.2756,
      "epoch": 0.33,
      "input_norm": 31.998132244745904,
      "input_norm/layer0": 31.998132244745904,
      "learning_rate": 0.005,
      "loss": 2.0807,
      "max_norm": 166.85643005371094,
      "max_norm/layer0": 166.85643005371094,
      "mean_norm": 56.187782287597656,
      "mean_norm/layer0": 56.187782287597656,
      "multicode_k": 1,
      "output_norm": 22.242043924331664,
      "output_norm/layer0": 22.242043924331664,
      "step": 3300
    },
    {
      "MSE": 523.8938673400878,
      "MSE/layer0": 523.8938673400878,
      "dead_code_fraction": 0.2733,
      "dead_code_fraction/layer0": 0.2733,
      "epoch": 0.34,
      "input_norm": 31.998154455820725,
      "input_norm/layer0": 31.998154455820725,
      "learning_rate": 0.005,
      "loss": 2.1234,
      "max_norm": 167.70089721679688,
      "max_norm/layer0": 167.70089721679688,
      "mean_norm": 56.36995506286621,
      "mean_norm/layer0": 56.36995506286621,
      "multicode_k": 1,
      "output_norm": 22.246343409220387,
      "output_norm/layer0": 22.246343409220387,
      "step": 3350
    },
    {
      "MSE": 522.7465829976402,
      "MSE/layer0": 522.7465829976402,
      "dead_code_fraction": 0.2741,
      "dead_code_fraction/layer0": 0.2741,
      "epoch": 0.34,
      "input_norm": 31.998157631556197,
      "input_norm/layer0": 31.998157631556197,
      "learning_rate": 0.005,
      "loss": 2.1138,
      "max_norm": 168.70301818847656,
      "max_norm/layer0": 168.70301818847656,
      "mean_norm": 56.55203437805176,
      "mean_norm/layer0": 56.55203437805176,
      "multicode_k": 1,
      "output_norm": 22.282327626546234,
      "output_norm/layer0": 22.282327626546234,
      "step": 3400
    },
    {
      "MSE": 522.0263201395671,
      "MSE/layer0": 522.0263201395671,
      "dead_code_fraction": 0.27335,
      "dead_code_fraction/layer0": 0.27335,
      "epoch": 0.34,
      "input_norm": 31.99815892855326,
      "input_norm/layer0": 31.99815892855326,
      "learning_rate": 0.005,
      "loss": 2.103,
      "max_norm": 169.3920135498047,
      "max_norm/layer0": 169.3920135498047,
      "mean_norm": 56.73575782775879,
      "mean_norm/layer0": 56.73575782775879,
      "multicode_k": 1,
      "output_norm": 22.29100898424786,
      "output_norm/layer0": 22.29100898424786,
      "step": 3450
    },
    {
      "MSE": 521.5609470621745,
      "MSE/layer0": 521.5609470621745,
      "dead_code_fraction": 0.27265,
      "dead_code_fraction/layer0": 0.27265,
      "epoch": 0.35,
      "input_norm": 31.99817145665487,
      "input_norm/layer0": 31.99817145665487,
      "learning_rate": 0.005,
      "loss": 2.1045,
      "max_norm": 170.13829040527344,
      "max_norm/layer0": 170.13829040527344,
      "mean_norm": 56.91371726989746,
      "mean_norm/layer0": 56.91371726989746,
      "multicode_k": 1,
      "output_norm": 22.309985055923462,
      "output_norm/layer0": 22.309985055923462,
      "step": 3500
    },
    {
      "epoch": 0.35,
      "eval_MSE/layer0": 523.0844207110149,
      "eval_accuracy": 0.5078879054512807,
      "eval_dead_code_fraction/layer0": 0.27345,
      "eval_input_norm/layer0": 31.998171135689724,
      "eval_loss": 2.1130311489105225,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 22.351890057112634,
      "eval_runtime": 158.0171,
      "eval_samples_per_second": 29.256,
      "eval_steps_per_second": 1.829,
      "step": 3500
    },
    {
      "MSE": 522.4261043294274,
      "MSE/layer0": 522.4261043294274,
      "dead_code_fraction": 0.27245,
      "dead_code_fraction/layer0": 0.27245,
      "epoch": 0.35,
      "input_norm": 31.998184868494675,
      "input_norm/layer0": 31.998184868494675,
      "learning_rate": 0.005,
      "loss": 2.1296,
      "max_norm": 171.21067810058594,
      "max_norm/layer0": 171.21067810058594,
      "mean_norm": 57.08243370056152,
      "mean_norm/layer0": 57.08243370056152,
      "multicode_k": 1,
      "output_norm": 22.307131767272942,
      "output_norm/layer0": 22.307131767272942,
      "step": 3550
    },
    {
      "MSE": 520.5630591837569,
      "MSE/layer0": 520.5630591837569,
      "dead_code_fraction": 0.2715,
      "dead_code_fraction/layer0": 0.2715,
      "epoch": 0.36,
      "input_norm": 31.998175201416018,
      "input_norm/layer0": 31.998175201416018,
      "learning_rate": 0.005,
      "loss": 2.0606,
      "max_norm": 172.018798828125,
      "max_norm/layer0": 172.018798828125,
      "mean_norm": 57.259552001953125,
      "mean_norm/layer0": 57.259552001953125,
      "multicode_k": 1,
      "output_norm": 22.33381741523742,
      "output_norm/layer0": 22.33381741523742,
      "step": 3600
    },
    {
      "MSE": 521.8190139770511,
      "MSE/layer0": 521.8190139770511,
      "dead_code_fraction": 0.26915,
      "dead_code_fraction/layer0": 0.26915,
      "epoch": 0.36,
      "input_norm": 31.998206920623783,
      "input_norm/layer0": 31.998206920623783,
      "learning_rate": 0.005,
      "loss": 2.1264,
      "max_norm": 173.08360290527344,
      "max_norm/layer0": 173.08360290527344,
      "mean_norm": 57.425479888916016,
      "mean_norm/layer0": 57.425479888916016,
      "multicode_k": 1,
      "output_norm": 22.321163501739488,
      "output_norm/layer0": 22.321163501739488,
      "step": 3650
    },
    {
      "MSE": 520.2701113382976,
      "MSE/layer0": 520.2701113382976,
      "dead_code_fraction": 0.26935,
      "dead_code_fraction/layer0": 0.26935,
      "epoch": 0.37,
      "input_norm": 31.99821238517761,
      "input_norm/layer0": 31.99821238517761,
      "learning_rate": 0.005,
      "loss": 2.1028,
      "max_norm": 174.31561279296875,
      "max_norm/layer0": 174.31561279296875,
      "mean_norm": 57.58916091918945,
      "mean_norm/layer0": 57.58916091918945,
      "multicode_k": 1,
      "output_norm": 22.34191367149354,
      "output_norm/layer0": 22.34191367149354,
      "step": 3700
    },
    {
      "MSE": 520.4189120992024,
      "MSE/layer0": 520.4189120992024,
      "dead_code_fraction": 0.26865,
      "dead_code_fraction/layer0": 0.26865,
      "epoch": 0.38,
      "input_norm": 31.99821661313375,
      "input_norm/layer0": 31.99821661313375,
      "learning_rate": 0.005,
      "loss": 2.106,
      "max_norm": 175.09739685058594,
      "max_norm/layer0": 175.09739685058594,
      "mean_norm": 57.75008010864258,
      "mean_norm/layer0": 57.75008010864258,
      "multicode_k": 1,
      "output_norm": 22.352550570170077,
      "output_norm/layer0": 22.352550570170077,
      "step": 3750
    },
    {
      "MSE": 520.3332616170245,
      "MSE/layer0": 520.3332616170245,
      "dead_code_fraction": 0.2705,
      "dead_code_fraction/layer0": 0.2705,
      "epoch": 0.38,
      "input_norm": 31.998228356043505,
      "input_norm/layer0": 31.998228356043505,
      "learning_rate": 0.005,
      "loss": 2.1318,
      "max_norm": 175.85955810546875,
      "max_norm/layer0": 175.85955810546875,
      "mean_norm": 57.9084529876709,
      "mean_norm/layer0": 57.9084529876709,
      "multicode_k": 1,
      "output_norm": 22.355525690714526,
      "output_norm/layer0": 22.355525690714526,
      "step": 3800
    },
    {
      "MSE": 519.1107161458334,
      "MSE/layer0": 519.1107161458334,
      "dead_code_fraction": 0.26585,
      "dead_code_fraction/layer0": 0.26585,
      "epoch": 0.39,
      "input_norm": 31.998228273391724,
      "input_norm/layer0": 31.998228273391724,
      "learning_rate": 0.005,
      "loss": 2.1063,
      "max_norm": 176.55845642089844,
      "max_norm/layer0": 176.55845642089844,
      "mean_norm": 58.0648193359375,
      "mean_norm/layer0": 58.0648193359375,
      "multicode_k": 1,
      "output_norm": 22.375479180018097,
      "output_norm/layer0": 22.375479180018097,
      "step": 3850
    },
    {
      "MSE": 520.279450937907,
      "MSE/layer0": 520.279450937907,
      "dead_code_fraction": 0.26475,
      "dead_code_fraction/layer0": 0.26475,
      "epoch": 0.39,
      "input_norm": 31.998248408635455,
      "input_norm/layer0": 31.998248408635455,
      "learning_rate": 0.005,
      "loss": 2.1158,
      "max_norm": 177.40316772460938,
      "max_norm/layer0": 177.40316772460938,
      "mean_norm": 58.21473693847656,
      "mean_norm/layer0": 58.21473693847656,
      "multicode_k": 1,
      "output_norm": 22.37501454989114,
      "output_norm/layer0": 22.37501454989114,
      "step": 3900
    },
    {
      "MSE": 520.3905441284179,
      "MSE/layer0": 520.3905441284179,
      "dead_code_fraction": 0.26645,
      "dead_code_fraction/layer0": 0.26645,
      "epoch": 0.4,
      "input_norm": 31.998255596160874,
      "input_norm/layer0": 31.998255596160874,
      "learning_rate": 0.005,
      "loss": 2.0919,
      "max_norm": 178.25682067871094,
      "max_norm/layer0": 178.25682067871094,
      "mean_norm": 58.36372947692871,
      "mean_norm/layer0": 58.36372947692871,
      "multicode_k": 1,
      "output_norm": 22.360030002593987,
      "output_norm/layer0": 22.360030002593987,
      "step": 3950
    },
    {
      "MSE": 520.0447977193196,
      "MSE/layer0": 520.0447977193196,
      "dead_code_fraction": 0.2638,
      "dead_code_fraction/layer0": 0.2638,
      "epoch": 0.4,
      "input_norm": 31.998260914484668,
      "input_norm/layer0": 31.998260914484668,
      "learning_rate": 0.005,
      "loss": 2.0944,
      "max_norm": 178.8519287109375,
      "max_norm/layer0": 178.8519287109375,
      "mean_norm": 58.51635932922363,
      "mean_norm/layer0": 58.51635932922363,
      "multicode_k": 1,
      "output_norm": 22.37334650675455,
      "output_norm/layer0": 22.37334650675455,
      "step": 4000
    },
    {
      "epoch": 0.4,
      "eval_MSE/layer0": 519.885230389297,
      "eval_accuracy": 0.5089345655588774,
      "eval_dead_code_fraction/layer0": 0.2655,
      "eval_input_norm/layer0": 31.998263675723535,
      "eval_loss": 2.0995683670043945,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 22.39302826134025,
      "eval_runtime": 158.5492,
      "eval_samples_per_second": 29.158,
      "eval_steps_per_second": 1.823,
      "step": 4000
    },
    {
      "MSE": 519.3041878255204,
      "MSE/layer0": 519.3041878255204,
      "dead_code_fraction": 0.2634,
      "dead_code_fraction/layer0": 0.2634,
      "epoch": 0.41,
      "input_norm": 31.998263047536216,
      "input_norm/layer0": 31.998263047536216,
      "learning_rate": 0.005,
      "loss": 2.0844,
      "max_norm": 179.35386657714844,
      "max_norm/layer0": 179.35386657714844,
      "mean_norm": 58.670223236083984,
      "mean_norm/layer0": 58.670223236083984,
      "multicode_k": 1,
      "output_norm": 22.375990848541264,
      "output_norm/layer0": 22.375990848541264,
      "step": 4050
    },
    {
      "MSE": 520.2196419270836,
      "MSE/layer0": 520.2196419270836,
      "dead_code_fraction": 0.2615,
      "dead_code_fraction/layer0": 0.2615,
      "epoch": 0.41,
      "input_norm": 31.99826691627503,
      "input_norm/layer0": 31.99826691627503,
      "learning_rate": 0.005,
      "loss": 2.0983,
      "max_norm": 179.91224670410156,
      "max_norm/layer0": 179.91224670410156,
      "mean_norm": 58.826820373535156,
      "mean_norm/layer0": 58.826820373535156,
      "multicode_k": 1,
      "output_norm": 22.372630256017054,
      "output_norm/layer0": 22.372630256017054,
      "step": 4100
    },
    {
      "MSE": 519.6039750162761,
      "MSE/layer0": 519.6039750162761,
      "dead_code_fraction": 0.26085,
      "dead_code_fraction/layer0": 0.26085,
      "epoch": 0.41,
      "input_norm": 31.998284708658858,
      "input_norm/layer0": 31.998284708658858,
      "learning_rate": 0.005,
      "loss": 2.0974,
      "max_norm": 180.4697265625,
      "max_norm/layer0": 180.4697265625,
      "mean_norm": 58.97820472717285,
      "mean_norm/layer0": 58.97820472717285,
      "multicode_k": 1,
      "output_norm": 22.377655258178706,
      "output_norm/layer0": 22.377655258178706,
      "step": 4150
    },
    {
      "MSE": 518.396603800456,
      "MSE/layer0": 518.396603800456,
      "dead_code_fraction": 0.26145,
      "dead_code_fraction/layer0": 0.26145,
      "epoch": 0.42,
      "input_norm": 31.998291470209757,
      "input_norm/layer0": 31.998291470209757,
      "learning_rate": 0.005,
      "loss": 2.1155,
      "max_norm": 180.8781280517578,
      "max_norm/layer0": 180.8781280517578,
      "mean_norm": 59.12506866455078,
      "mean_norm/layer0": 59.12506866455078,
      "multicode_k": 1,
      "output_norm": 22.407741336822514,
      "output_norm/layer0": 22.407741336822514,
      "step": 4200
    },
    {
      "MSE": 518.4843705240887,
      "MSE/layer0": 518.4843705240887,
      "dead_code_fraction": 0.2605,
      "dead_code_fraction/layer0": 0.2605,
      "epoch": 0.42,
      "input_norm": 31.99829554239909,
      "input_norm/layer0": 31.99829554239909,
      "learning_rate": 0.005,
      "loss": 2.1004,
      "max_norm": 181.51483154296875,
      "max_norm/layer0": 181.51483154296875,
      "mean_norm": 59.271942138671875,
      "mean_norm/layer0": 59.271942138671875,
      "multicode_k": 1,
      "output_norm": 22.40968936284383,
      "output_norm/layer0": 22.40968936284383,
      "step": 4250
    },
    {
      "MSE": 518.0018126932782,
      "MSE/layer0": 518.0018126932782,
      "dead_code_fraction": 0.2586,
      "dead_code_fraction/layer0": 0.2586,
      "epoch": 0.43,
      "input_norm": 31.998309599558517,
      "input_norm/layer0": 31.998309599558517,
      "learning_rate": 0.005,
      "loss": 2.0848,
      "max_norm": 181.8904266357422,
      "max_norm/layer0": 181.8904266357422,
      "mean_norm": 59.40836715698242,
      "mean_norm/layer0": 59.40836715698242,
      "multicode_k": 1,
      "output_norm": 22.42666608492533,
      "output_norm/layer0": 22.42666608492533,
      "step": 4300
    },
    {
      "MSE": 518.2576261901858,
      "MSE/layer0": 518.2576261901858,
      "dead_code_fraction": 0.25825,
      "dead_code_fraction/layer0": 0.25825,
      "epoch": 0.43,
      "input_norm": 31.99831358591716,
      "input_norm/layer0": 31.99831358591716,
      "learning_rate": 0.005,
      "loss": 2.0778,
      "max_norm": 182.52023315429688,
      "max_norm/layer0": 182.52023315429688,
      "mean_norm": 59.546592712402344,
      "mean_norm/layer0": 59.546592712402344,
      "multicode_k": 1,
      "output_norm": 22.415684442520128,
      "output_norm/layer0": 22.415684442520128,
      "step": 4350
    },
    {
      "MSE": 517.176724141439,
      "MSE/layer0": 517.176724141439,
      "dead_code_fraction": 0.25845,
      "dead_code_fraction/layer0": 0.25845,
      "epoch": 0.44,
      "input_norm": 31.998328673044824,
      "input_norm/layer0": 31.998328673044824,
      "learning_rate": 0.005,
      "loss": 2.0989,
      "max_norm": 183.30308532714844,
      "max_norm/layer0": 183.30308532714844,
      "mean_norm": 59.680843353271484,
      "mean_norm/layer0": 59.680843353271484,
      "multicode_k": 1,
      "output_norm": 22.435629587173473,
      "output_norm/layer0": 22.435629587173473,
      "step": 4400
    },
    {
      "MSE": 516.945845082601,
      "MSE/layer0": 516.945845082601,
      "dead_code_fraction": 0.2589,
      "dead_code_fraction/layer0": 0.2589,
      "epoch": 0.45,
      "input_norm": 31.998329006830847,
      "input_norm/layer0": 31.998329006830847,
      "learning_rate": 0.005,
      "loss": 2.087,
      "max_norm": 184.17068481445312,
      "max_norm/layer0": 184.17068481445312,
      "mean_norm": 59.81003379821777,
      "mean_norm/layer0": 59.81003379821777,
      "multicode_k": 1,
      "output_norm": 22.447185754775994,
      "output_norm/layer0": 22.447185754775994,
      "step": 4450
    },
    {
      "MSE": 517.1110377502445,
      "MSE/layer0": 517.1110377502445,
      "dead_code_fraction": 0.25715,
      "dead_code_fraction/layer0": 0.25715,
      "epoch": 0.45,
      "input_norm": 31.998346713384,
      "input_norm/layer0": 31.998346713384,
      "learning_rate": 0.005,
      "loss": 2.1314,
      "max_norm": 185.53944396972656,
      "max_norm/layer0": 185.53944396972656,
      "mean_norm": 59.940223693847656,
      "mean_norm/layer0": 59.940223693847656,
      "multicode_k": 1,
      "output_norm": 22.444066270192472,
      "output_norm/layer0": 22.444066270192472,
      "step": 4500
    },
    {
      "epoch": 0.45,
      "eval_MSE/layer0": 517.038530914551,
      "eval_accuracy": 0.5114514130862962,
      "eval_dead_code_fraction/layer0": 0.25675,
      "eval_input_norm/layer0": 31.998349543131468,
      "eval_loss": 2.0859904289245605,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 22.471955899059722,
      "eval_runtime": 158.2677,
      "eval_samples_per_second": 29.21,
      "eval_steps_per_second": 1.826,
      "step": 4500
    },
    {
      "MSE": 516.5108834838866,
      "MSE/layer0": 516.5108834838866,
      "dead_code_fraction": 0.2556,
      "dead_code_fraction/layer0": 0.2556,
      "epoch": 0.46,
      "input_norm": 31.99834162076315,
      "input_norm/layer0": 31.99834162076315,
      "learning_rate": 0.005,
      "loss": 2.0594,
      "max_norm": 186.7916259765625,
      "max_norm/layer0": 186.7916259765625,
      "mean_norm": 60.06948661804199,
      "mean_norm/layer0": 60.06948661804199,
      "multicode_k": 1,
      "output_norm": 22.45672461509705,
      "output_norm/layer0": 22.45672461509705,
      "step": 4550
    },
    {
      "MSE": 517.5840914408367,
      "MSE/layer0": 517.5840914408367,
      "dead_code_fraction": 0.25275,
      "dead_code_fraction/layer0": 0.25275,
      "epoch": 0.46,
      "input_norm": 31.998361612955726,
      "input_norm/layer0": 31.998361612955726,
      "learning_rate": 0.005,
      "loss": 2.116,
      "max_norm": 187.44607543945312,
      "max_norm/layer0": 187.44607543945312,
      "mean_norm": 60.1932258605957,
      "mean_norm/layer0": 60.1932258605957,
      "multicode_k": 1,
      "output_norm": 22.445463349024458,
      "output_norm/layer0": 22.445463349024458,
      "step": 4600
    },
    {
      "MSE": 515.9212077331542,
      "MSE/layer0": 515.9212077331542,
      "dead_code_fraction": 0.2549,
      "dead_code_fraction/layer0": 0.2549,
      "epoch": 0.47,
      "input_norm": 31.998358809153245,
      "input_norm/layer0": 31.998358809153245,
      "learning_rate": 0.005,
      "loss": 2.0851,
      "max_norm": 187.99063110351562,
      "max_norm/layer0": 187.99063110351562,
      "mean_norm": 60.3179931640625,
      "mean_norm/layer0": 60.3179931640625,
      "multicode_k": 1,
      "output_norm": 22.468881686528533,
      "output_norm/layer0": 22.468881686528533,
      "step": 4650
    },
    {
      "MSE": 516.2712020365398,
      "MSE/layer0": 516.2712020365398,
      "dead_code_fraction": 0.2539,
      "dead_code_fraction/layer0": 0.2539,
      "epoch": 0.47,
      "input_norm": 31.99836943308513,
      "input_norm/layer0": 31.99836943308513,
      "learning_rate": 0.005,
      "loss": 2.0646,
      "max_norm": 188.7075653076172,
      "max_norm/layer0": 188.7075653076172,
      "mean_norm": 60.442317962646484,
      "mean_norm/layer0": 60.442317962646484,
      "multicode_k": 1,
      "output_norm": 22.458747002283737,
      "output_norm/layer0": 22.458747002283737,
      "step": 4700
    },
    {
      "MSE": 515.2177518717448,
      "MSE/layer0": 515.2177518717448,
      "dead_code_fraction": 0.25225,
      "dead_code_fraction/layer0": 0.25225,
      "epoch": 0.47,
      "input_norm": 31.99837938944498,
      "input_norm/layer0": 31.99837938944498,
      "learning_rate": 0.005,
      "loss": 2.0508,
      "max_norm": 189.4132080078125,
      "max_norm/layer0": 189.4132080078125,
      "mean_norm": 60.56760787963867,
      "mean_norm/layer0": 60.56760787963867,
      "multicode_k": 1,
      "output_norm": 22.48432564417522,
      "output_norm/layer0": 22.48432564417522,
      "step": 4750
    },
    {
      "MSE": 517.7876967760659,
      "MSE/layer0": 517.7876967760659,
      "dead_code_fraction": 0.2504,
      "dead_code_fraction/layer0": 0.2504,
      "epoch": 1.0,
      "input_norm": 31.998372135461928,
      "input_norm/layer0": 31.998372135461928,
      "learning_rate": 0.005,
      "loss": 2.0347,
      "max_norm": 189.93084716796875,
      "max_norm/layer0": 189.93084716796875,
      "mean_norm": 60.689674377441406,
      "mean_norm/layer0": 60.689674377441406,
      "multicode_k": 1,
      "output_norm": 22.4315491425679,
      "output_norm/layer0": 22.4315491425679,
      "step": 4800
    },
    {
      "MSE": 515.4498620096845,
      "MSE/layer0": 515.4498620096845,
      "dead_code_fraction": 0.2505,
      "dead_code_fraction/layer0": 0.2505,
      "epoch": 1.01,
      "input_norm": 31.998399356206253,
      "input_norm/layer0": 31.998399356206253,
      "learning_rate": 0.005,
      "loss": 2.1351,
      "max_norm": 190.8528289794922,
      "max_norm/layer0": 190.8528289794922,
      "mean_norm": 60.80255126953125,
      "mean_norm/layer0": 60.80255126953125,
      "multicode_k": 1,
      "output_norm": 22.488870484034226,
      "output_norm/layer0": 22.488870484034226,
      "step": 4850
    },
    {
      "MSE": 515.1998943074543,
      "MSE/layer0": 515.1998943074543,
      "dead_code_fraction": 0.24975,
      "dead_code_fraction/layer0": 0.24975,
      "epoch": 1.01,
      "input_norm": 31.998391094207765,
      "input_norm/layer0": 31.998391094207765,
      "learning_rate": 0.005,
      "loss": 2.0344,
      "max_norm": 191.88272094726562,
      "max_norm/layer0": 191.88272094726562,
      "mean_norm": 60.923635482788086,
      "mean_norm/layer0": 60.923635482788086,
      "multicode_k": 1,
      "output_norm": 22.493143533070885,
      "output_norm/layer0": 22.493143533070885,
      "step": 4900
    },
    {
      "MSE": 516.1670984395346,
      "MSE/layer0": 516.1670984395346,
      "dead_code_fraction": 0.2478,
      "dead_code_fraction/layer0": 0.2478,
      "epoch": 1.02,
      "input_norm": 31.99841277122497,
      "input_norm/layer0": 31.99841277122497,
      "learning_rate": 0.005,
      "loss": 2.0591,
      "max_norm": 192.84405517578125,
      "max_norm/layer0": 192.84405517578125,
      "mean_norm": 61.04226303100586,
      "mean_norm/layer0": 61.04226303100586,
      "multicode_k": 1,
      "output_norm": 22.47217222531637,
      "output_norm/layer0": 22.47217222531637,
      "step": 4950
    },
    {
      "MSE": 515.1936482747396,
      "MSE/layer0": 515.1936482747396,
      "dead_code_fraction": 0.2468,
      "dead_code_fraction/layer0": 0.2468,
      "epoch": 1.02,
      "input_norm": 31.998419497807816,
      "input_norm/layer0": 31.998419497807816,
      "learning_rate": 0.005,
      "loss": 2.0685,
      "max_norm": 193.819580078125,
      "max_norm/layer0": 193.819580078125,
      "mean_norm": 61.15685844421387,
      "mean_norm/layer0": 61.15685844421387,
      "multicode_k": 1,
      "output_norm": 22.499980732599887,
      "output_norm/layer0": 22.499980732599887,
      "step": 5000
    },
    {
      "epoch": 1.02,
      "eval_MSE/layer0": 514.3711726943474,
      "eval_accuracy": 0.5131406590660113,
      "eval_dead_code_fraction/layer0": 0.24975,
      "eval_input_norm/layer0": 31.998424857410036,
      "eval_loss": 2.076988458633423,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 22.494330299537523,
      "eval_runtime": 157.9418,
      "eval_samples_per_second": 29.27,
      "eval_steps_per_second": 1.83,
      "step": 5000
    },
    {
      "MSE": 515.1962452189127,
      "MSE/layer0": 515.1962452189127,
      "dead_code_fraction": 0.24585,
      "dead_code_fraction/layer0": 0.24585,
      "epoch": 1.03,
      "input_norm": 31.998427387873342,
      "input_norm/layer0": 31.998427387873342,
      "learning_rate": 0.005,
      "loss": 2.07,
      "max_norm": 194.8584442138672,
      "max_norm/layer0": 194.8584442138672,
      "mean_norm": 61.2799015045166,
      "mean_norm/layer0": 61.2799015045166,
      "multicode_k": 1,
      "output_norm": 22.492868417104084,
      "output_norm/layer0": 22.492868417104084,
      "step": 5050
    },
    {
      "MSE": 514.6688102722171,
      "MSE/layer0": 514.6688102722171,
      "dead_code_fraction": 0.24495,
      "dead_code_fraction/layer0": 0.24495,
      "epoch": 1.03,
      "input_norm": 31.99842824935913,
      "input_norm/layer0": 31.99842824935913,
      "learning_rate": 0.005,
      "loss": 2.0308,
      "max_norm": 195.33718872070312,
      "max_norm/layer0": 195.33718872070312,
      "mean_norm": 61.397443771362305,
      "mean_norm/layer0": 61.397443771362305,
      "multicode_k": 1,
      "output_norm": 22.502648471196487,
      "output_norm/layer0": 22.502648471196487,
      "step": 5100
    },
    {
      "MSE": 515.46877843221,
      "MSE/layer0": 515.46877843221,
      "dead_code_fraction": 0.2426,
      "dead_code_fraction/layer0": 0.2426,
      "epoch": 1.04,
      "input_norm": 31.998430423736572,
      "input_norm/layer0": 31.998430423736572,
      "learning_rate": 0.005,
      "loss": 2.0427,
      "max_norm": 195.8143310546875,
      "max_norm/layer0": 195.8143310546875,
      "mean_norm": 61.51255416870117,
      "mean_norm/layer0": 61.51255416870117,
      "multicode_k": 1,
      "output_norm": 22.500031328201295,
      "output_norm/layer0": 22.500031328201295,
      "step": 5150
    },
    {
      "MSE": 515.1060639953612,
      "MSE/layer0": 515.1060639953612,
      "dead_code_fraction": 0.2439,
      "dead_code_fraction/layer0": 0.2439,
      "epoch": 1.04,
      "input_norm": 31.998455877304075,
      "input_norm/layer0": 31.998455877304075,
      "learning_rate": 0.005,
      "loss": 2.1036,
      "max_norm": 196.40415954589844,
      "max_norm/layer0": 196.40415954589844,
      "mean_norm": 61.620216369628906,
      "mean_norm/layer0": 61.620216369628906,
      "multicode_k": 1,
      "output_norm": 22.504082736968975,
      "output_norm/layer0": 22.504082736968975,
      "step": 5200
    },
    {
      "MSE": 514.64603418986,
      "MSE/layer0": 514.64603418986,
      "dead_code_fraction": 0.24415,
      "dead_code_fraction/layer0": 0.24415,
      "epoch": 1.05,
      "input_norm": 31.99846438090008,
      "input_norm/layer0": 31.99846438090008,
      "learning_rate": 0.005,
      "loss": 2.1032,
      "max_norm": 197.31690979003906,
      "max_norm/layer0": 197.31690979003906,
      "mean_norm": 61.73128890991211,
      "mean_norm/layer0": 61.73128890991211,
      "multicode_k": 1,
      "output_norm": 22.51759773572286,
      "output_norm/layer0": 22.51759773572286,
      "step": 5250
    },
    {
      "MSE": 514.5095549011231,
      "MSE/layer0": 514.5095549011231,
      "dead_code_fraction": 0.24245,
      "dead_code_fraction/layer0": 0.24245,
      "epoch": 1.05,
      "input_norm": 31.998469727834063,
      "input_norm/layer0": 31.998469727834063,
      "learning_rate": 0.005,
      "loss": 2.0884,
      "max_norm": 198.30520629882812,
      "max_norm/layer0": 198.30520629882812,
      "mean_norm": 61.84503173828125,
      "mean_norm/layer0": 61.84503173828125,
      "multicode_k": 1,
      "output_norm": 22.52236960728964,
      "output_norm/layer0": 22.52236960728964,
      "step": 5300
    },
    {
      "MSE": 514.2185153198242,
      "MSE/layer0": 514.2185153198242,
      "dead_code_fraction": 0.2423,
      "dead_code_fraction/layer0": 0.2423,
      "epoch": 1.06,
      "input_norm": 31.99846864700317,
      "input_norm/layer0": 31.99846864700317,
      "learning_rate": 0.005,
      "loss": 2.0541,
      "max_norm": 198.76315307617188,
      "max_norm/layer0": 198.76315307617188,
      "mean_norm": 61.954532623291016,
      "mean_norm/layer0": 61.954532623291016,
      "multicode_k": 1,
      "output_norm": 22.523964621225986,
      "output_norm/layer0": 22.523964621225986,
      "step": 5350
    },
    {
      "MSE": 514.2201423136396,
      "MSE/layer0": 514.2201423136396,
      "dead_code_fraction": 0.24065,
      "dead_code_fraction/layer0": 0.24065,
      "epoch": 1.06,
      "input_norm": 31.99848121643067,
      "input_norm/layer0": 31.99848121643067,
      "learning_rate": 0.005,
      "loss": 2.0722,
      "max_norm": 199.5216522216797,
      "max_norm/layer0": 199.5216522216797,
      "mean_norm": 62.062015533447266,
      "mean_norm/layer0": 62.062015533447266,
      "multicode_k": 1,
      "output_norm": 22.529434289932254,
      "output_norm/layer0": 22.529434289932254,
      "step": 5400
    },
    {
      "MSE": 513.0346335347496,
      "MSE/layer0": 513.0346335347496,
      "dead_code_fraction": 0.2396,
      "dead_code_fraction/layer0": 0.2396,
      "epoch": 1.07,
      "input_norm": 31.998482402165727,
      "input_norm/layer0": 31.998482402165727,
      "learning_rate": 0.005,
      "loss": 2.0839,
      "max_norm": 199.89144897460938,
      "max_norm/layer0": 199.89144897460938,
      "mean_norm": 62.16894721984863,
      "mean_norm/layer0": 62.16894721984863,
      "multicode_k": 1,
      "output_norm": 22.549472332000725,
      "output_norm/layer0": 22.549472332000725,
      "step": 5450
    },
    {
      "MSE": 512.9845250447588,
      "MSE/layer0": 512.9845250447588,
      "dead_code_fraction": 0.23995,
      "dead_code_fraction/layer0": 0.23995,
      "epoch": 1.07,
      "input_norm": 31.99848415692648,
      "input_norm/layer0": 31.99848415692648,
      "learning_rate": 0.005,
      "loss": 2.0496,
      "max_norm": 200.10585021972656,
      "max_norm/layer0": 200.10585021972656,
      "mean_norm": 62.28166961669922,
      "mean_norm/layer0": 62.28166961669922,
      "multicode_k": 1,
      "output_norm": 22.535003283818554,
      "output_norm/layer0": 22.535003283818554,
      "step": 5500
    },
    {
      "epoch": 1.07,
      "eval_MSE/layer0": 513.7822700020247,
      "eval_accuracy": 0.5137449731240944,
      "eval_dead_code_fraction/layer0": 0.23805,
      "eval_input_norm/layer0": 31.998499035448475,
      "eval_loss": 2.0730204582214355,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 22.562518398921107,
      "eval_runtime": 158.2513,
      "eval_samples_per_second": 29.213,
      "eval_steps_per_second": 1.826,
      "step": 5500
    },
    {
      "MSE": 513.4142807515464,
      "MSE/layer0": 513.4142807515464,
      "dead_code_fraction": 0.2388,
      "dead_code_fraction/layer0": 0.2388,
      "epoch": 1.08,
      "input_norm": 31.99849408785501,
      "input_norm/layer0": 31.99849408785501,
      "learning_rate": 0.005,
      "loss": 2.0918,
      "max_norm": 200.3399200439453,
      "max_norm/layer0": 200.3399200439453,
      "mean_norm": 62.38692855834961,
      "mean_norm/layer0": 62.38692855834961,
      "multicode_k": 1,
      "output_norm": 22.54020097732544,
      "output_norm/layer0": 22.54020097732544,
      "step": 5550
    },
    {
      "MSE": 512.2161093648273,
      "MSE/layer0": 512.2161093648273,
      "dead_code_fraction": 0.23455,
      "dead_code_fraction/layer0": 0.23455,
      "epoch": 1.08,
      "input_norm": 31.998499333063755,
      "input_norm/layer0": 31.998499333063755,
      "learning_rate": 0.005,
      "loss": 2.0812,
      "max_norm": 200.90451049804688,
      "max_norm/layer0": 200.90451049804688,
      "mean_norm": 62.49030685424805,
      "mean_norm/layer0": 62.49030685424805,
      "multicode_k": 1,
      "output_norm": 22.562892615000422,
      "output_norm/layer0": 22.562892615000422,
      "step": 5600
    },
    {
      "MSE": 513.2079597473146,
      "MSE/layer0": 513.2079597473146,
      "dead_code_fraction": 0.2364,
      "dead_code_fraction/layer0": 0.2364,
      "epoch": 1.09,
      "input_norm": 31.998499097824094,
      "input_norm/layer0": 31.998499097824094,
      "learning_rate": 0.005,
      "loss": 2.0405,
      "max_norm": 201.2469940185547,
      "max_norm/layer0": 201.2469940185547,
      "mean_norm": 62.587249755859375,
      "mean_norm/layer0": 62.587249755859375,
      "multicode_k": 1,
      "output_norm": 22.551958309809354,
      "output_norm/layer0": 22.551958309809354,
      "step": 5650
    },
    {
      "MSE": 512.3663133748375,
      "MSE/layer0": 512.3663133748375,
      "dead_code_fraction": 0.2359,
      "dead_code_fraction/layer0": 0.2359,
      "epoch": 1.09,
      "input_norm": 31.998522087732937,
      "input_norm/layer0": 31.998522087732937,
      "learning_rate": 0.005,
      "loss": 2.0976,
      "max_norm": 202.06686401367188,
      "max_norm/layer0": 202.06686401367188,
      "mean_norm": 62.68406677246094,
      "mean_norm/layer0": 62.68406677246094,
      "multicode_k": 1,
      "output_norm": 22.56861629168192,
      "output_norm/layer0": 22.56861629168192,
      "step": 5700
    },
    {
      "MSE": 513.556918741862,
      "MSE/layer0": 513.556918741862,
      "dead_code_fraction": 0.2325,
      "dead_code_fraction/layer0": 0.2325,
      "epoch": 1.1,
      "input_norm": 31.99852702458699,
      "input_norm/layer0": 31.99852702458699,
      "learning_rate": 0.005,
      "loss": 2.0531,
      "max_norm": 202.5853729248047,
      "max_norm/layer0": 202.5853729248047,
      "mean_norm": 62.78022766113281,
      "mean_norm/layer0": 62.78022766113281,
      "multicode_k": 1,
      "output_norm": 22.55354828198752,
      "output_norm/layer0": 22.55354828198752,
      "step": 5750
    },
    {
      "MSE": 514.1225356547038,
      "MSE/layer0": 514.1225356547038,
      "dead_code_fraction": 0.23125,
      "dead_code_fraction/layer0": 0.23125,
      "epoch": 1.1,
      "input_norm": 31.998530540466305,
      "input_norm/layer0": 31.998530540466305,
      "learning_rate": 0.005,
      "loss": 2.0333,
      "max_norm": 202.8258514404297,
      "max_norm/layer0": 202.8258514404297,
      "mean_norm": 62.881099700927734,
      "mean_norm/layer0": 62.881099700927734,
      "multicode_k": 1,
      "output_norm": 22.538857170740776,
      "output_norm/layer0": 22.538857170740776,
      "step": 5800
    },
    {
      "MSE": 512.891567026774,
      "MSE/layer0": 512.891567026774,
      "dead_code_fraction": 0.23305,
      "dead_code_fraction/layer0": 0.23305,
      "epoch": 1.11,
      "input_norm": 31.998542674382527,
      "input_norm/layer0": 31.998542674382527,
      "learning_rate": 0.005,
      "loss": 2.0894,
      "max_norm": 203.2826385498047,
      "max_norm/layer0": 203.2826385498047,
      "mean_norm": 62.98002815246582,
      "mean_norm/layer0": 62.98002815246582,
      "multicode_k": 1,
      "output_norm": 22.556459398269645,
      "output_norm/layer0": 22.556459398269645,
      "step": 5850
    },
    {
      "MSE": 512.6300255839031,
      "MSE/layer0": 512.6300255839031,
      "dead_code_fraction": 0.23175,
      "dead_code_fraction/layer0": 0.23175,
      "epoch": 1.11,
      "input_norm": 31.998538637161257,
      "input_norm/layer0": 31.998538637161257,
      "learning_rate": 0.005,
      "loss": 2.0371,
      "max_norm": 203.56114196777344,
      "max_norm/layer0": 203.56114196777344,
      "mean_norm": 63.085018157958984,
      "mean_norm/layer0": 63.085018157958984,
      "multicode_k": 1,
      "output_norm": 22.55499767621359,
      "output_norm/layer0": 22.55499767621359,
      "step": 5900
    },
    {
      "MSE": 512.6470455423993,
      "MSE/layer0": 512.6470455423993,
      "dead_code_fraction": 0.22945,
      "dead_code_fraction/layer0": 0.22945,
      "epoch": 1.12,
      "input_norm": 31.998542264302582,
      "input_norm/layer0": 31.998542264302582,
      "learning_rate": 0.005,
      "loss": 2.0693,
      "max_norm": 204.18482971191406,
      "max_norm/layer0": 204.18482971191406,
      "mean_norm": 63.186561584472656,
      "mean_norm/layer0": 63.186561584472656,
      "multicode_k": 1,
      "output_norm": 22.56271686236063,
      "output_norm/layer0": 22.56271686236063,
      "step": 5950
    },
    {
      "MSE": 512.2647941589354,
      "MSE/layer0": 512.2647941589354,
      "dead_code_fraction": 0.23005,
      "dead_code_fraction/layer0": 0.23005,
      "epoch": 1.12,
      "input_norm": 31.99855575561523,
      "input_norm/layer0": 31.99855575561523,
      "learning_rate": 0.005,
      "loss": 2.1002,
      "max_norm": 204.59375,
      "max_norm/layer0": 204.59375,
      "mean_norm": 63.287431716918945,
      "mean_norm/layer0": 63.287431716918945,
      "multicode_k": 1,
      "output_norm": 22.56941809654236,
      "output_norm/layer0": 22.56941809654236,
      "step": 6000
    },
    {
      "epoch": 1.12,
      "eval_MSE/layer0": 510.787595085063,
      "eval_accuracy": 0.5144414778502405,
      "eval_dead_code_fraction/layer0": 0.2305,
      "eval_input_norm/layer0": 31.998558920130655,
      "eval_loss": 2.0667405128479004,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 22.588203073708286,
      "eval_runtime": 158.1457,
      "eval_samples_per_second": 29.233,
      "eval_steps_per_second": 1.827,
      "step": 6000
    },
    {
      "MSE": 512.2951668802899,
      "MSE/layer0": 512.2951668802899,
      "dead_code_fraction": 0.2284,
      "dead_code_fraction/layer0": 0.2284,
      "epoch": 1.13,
      "input_norm": 31.998558203379314,
      "input_norm/layer0": 31.998558203379314,
      "learning_rate": 0.005,
      "loss": 2.0645,
      "max_norm": 205.16860961914062,
      "max_norm/layer0": 205.16860961914062,
      "mean_norm": 63.38333702087402,
      "mean_norm/layer0": 63.38333702087402,
      "multicode_k": 1,
      "output_norm": 22.570796213150032,
      "output_norm/layer0": 22.570796213150032,
      "step": 6050
    },
    {
      "MSE": 512.1381341044107,
      "MSE/layer0": 512.1381341044107,
      "dead_code_fraction": 0.22855,
      "dead_code_fraction/layer0": 0.22855,
      "epoch": 1.13,
      "input_norm": 31.99856172879537,
      "input_norm/layer0": 31.99856172879537,
      "learning_rate": 0.005,
      "loss": 2.0856,
      "max_norm": 205.37376403808594,
      "max_norm/layer0": 205.37376403808594,
      "mean_norm": 63.47422790527344,
      "mean_norm/layer0": 63.47422790527344,
      "multicode_k": 1,
      "output_norm": 22.58201634724934,
      "output_norm/layer0": 22.58201634724934,
      "step": 6100
    },
    {
      "MSE": 512.7539996846516,
      "MSE/layer0": 512.7539996846516,
      "dead_code_fraction": 0.22755,
      "dead_code_fraction/layer0": 0.22755,
      "epoch": 1.14,
      "input_norm": 31.99856161753337,
      "input_norm/layer0": 31.99856161753337,
      "learning_rate": 0.005,
      "loss": 2.0468,
      "max_norm": 205.76866149902344,
      "max_norm/layer0": 205.76866149902344,
      "mean_norm": 63.56420707702637,
      "mean_norm/layer0": 63.56420707702637,
      "multicode_k": 1,
      "output_norm": 22.575629208882646,
      "output_norm/layer0": 22.575629208882646,
      "step": 6150
    },
    {
      "MSE": 512.1215149434411,
      "MSE/layer0": 512.1215149434411,
      "dead_code_fraction": 0.2268,
      "dead_code_fraction/layer0": 0.2268,
      "epoch": 1.14,
      "input_norm": 31.998577674229928,
      "input_norm/layer0": 31.998577674229928,
      "learning_rate": 0.005,
      "loss": 2.0663,
      "max_norm": 206.54251098632812,
      "max_norm/layer0": 206.54251098632812,
      "mean_norm": 63.64880561828613,
      "mean_norm/layer0": 63.64880561828613,
      "multicode_k": 1,
      "output_norm": 22.58266611417133,
      "output_norm/layer0": 22.58266611417133,
      "step": 6200
    },
    {
      "MSE": 513.3685421752932,
      "MSE/layer0": 513.3685421752932,
      "dead_code_fraction": 0.22515,
      "dead_code_fraction/layer0": 0.22515,
      "epoch": 1.15,
      "input_norm": 31.998585720062266,
      "input_norm/layer0": 31.998585720062266,
      "learning_rate": 0.005,
      "loss": 2.0807,
      "max_norm": 207.23460388183594,
      "max_norm/layer0": 207.23460388183594,
      "mean_norm": 63.73150444030762,
      "mean_norm/layer0": 63.73150444030762,
      "multicode_k": 1,
      "output_norm": 22.574931882222508,
      "output_norm/layer0": 22.574931882222508,
      "step": 6250
    },
    {
      "MSE": 512.1649493916829,
      "MSE/layer0": 512.1649493916829,
      "dead_code_fraction": 0.2243,
      "dead_code_fraction/layer0": 0.2243,
      "epoch": 1.15,
      "input_norm": 31.99859083811442,
      "input_norm/layer0": 31.99859083811442,
      "learning_rate": 0.005,
      "loss": 1.9994,
      "max_norm": 207.4078826904297,
      "max_norm/layer0": 207.4078826904297,
      "mean_norm": 63.8239631652832,
      "mean_norm/layer0": 63.8239631652832,
      "multicode_k": 1,
      "output_norm": 22.573653513590493,
      "output_norm/layer0": 22.573653513590493,
      "step": 6300
    },
    {
      "MSE": 512.4084614054359,
      "MSE/layer0": 512.4084614054359,
      "dead_code_fraction": 0.22405,
      "dead_code_fraction/layer0": 0.22405,
      "epoch": 1.16,
      "input_norm": 31.998589369455978,
      "input_norm/layer0": 31.998589369455978,
      "learning_rate": 0.005,
      "loss": 2.0383,
      "max_norm": 207.421875,
      "max_norm/layer0": 207.421875,
      "mean_norm": 63.91918754577637,
      "mean_norm/layer0": 63.91918754577637,
      "multicode_k": 1,
      "output_norm": 22.570101757049564,
      "output_norm/layer0": 22.570101757049564,
      "step": 6350
    },
    {
      "MSE": 511.3037980651857,
      "MSE/layer0": 511.3037980651857,
      "dead_code_fraction": 0.22325,
      "dead_code_fraction/layer0": 0.22325,
      "epoch": 1.16,
      "input_norm": 31.9986056105296,
      "input_norm/layer0": 31.9986056105296,
      "learning_rate": 0.005,
      "loss": 2.0836,
      "max_norm": 207.90211486816406,
      "max_norm/layer0": 207.90211486816406,
      "mean_norm": 64.0091323852539,
      "mean_norm/layer0": 64.0091323852539,
      "multicode_k": 1,
      "output_norm": 22.591040735244757,
      "output_norm/layer0": 22.591040735244757,
      "step": 6400
    },
    {
      "MSE": 511.63349212646506,
      "MSE/layer0": 511.63349212646506,
      "dead_code_fraction": 0.2231,
      "dead_code_fraction/layer0": 0.2231,
      "epoch": 1.17,
      "input_norm": 31.998600152333573,
      "input_norm/layer0": 31.998600152333573,
      "learning_rate": 0.005,
      "loss": 2.049,
      "max_norm": 208.1908416748047,
      "max_norm/layer0": 208.1908416748047,
      "mean_norm": 64.09888458251953,
      "mean_norm/layer0": 64.09888458251953,
      "multicode_k": 1,
      "output_norm": 22.598680645624796,
      "output_norm/layer0": 22.598680645624796,
      "step": 6450
    },
    {
      "MSE": 510.1135516866045,
      "MSE/layer0": 510.1135516866045,
      "dead_code_fraction": 0.2198,
      "dead_code_fraction/layer0": 0.2198,
      "epoch": 1.17,
      "input_norm": 31.99861148198446,
      "input_norm/layer0": 31.99861148198446,
      "learning_rate": 0.005,
      "loss": 2.0723,
      "max_norm": 208.76829528808594,
      "max_norm/layer0": 208.76829528808594,
      "mean_norm": 64.1937198638916,
      "mean_norm/layer0": 64.1937198638916,
      "multicode_k": 1,
      "output_norm": 22.610935223897293,
      "output_norm/layer0": 22.610935223897293,
      "step": 6500
    },
    {
      "epoch": 1.17,
      "eval_MSE/layer0": 510.5624312578848,
      "eval_accuracy": 0.5148121435408701,
      "eval_dead_code_fraction/layer0": 0.2206,
      "eval_input_norm/layer0": 31.99861497196212,
      "eval_loss": 2.0631778240203857,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 22.613337997850753,
      "eval_runtime": 157.9752,
      "eval_samples_per_second": 29.264,
      "eval_steps_per_second": 1.829,
      "step": 6500
    },
    {
      "MSE": 511.1518494669597,
      "MSE/layer0": 511.1518494669597,
      "dead_code_fraction": 0.2202,
      "dead_code_fraction/layer0": 0.2202,
      "epoch": 1.18,
      "input_norm": 31.998620487848918,
      "input_norm/layer0": 31.998620487848918,
      "learning_rate": 0.005,
      "loss": 2.0713,
      "max_norm": 209.1894989013672,
      "max_norm/layer0": 209.1894989013672,
      "mean_norm": 64.28516006469727,
      "mean_norm/layer0": 64.28516006469727,
      "multicode_k": 1,
      "output_norm": 22.59137951215108,
      "output_norm/layer0": 22.59137951215108,
      "step": 6550
    },
    {
      "MSE": 511.4045928446453,
      "MSE/layer0": 511.4045928446453,
      "dead_code_fraction": 0.2177,
      "dead_code_fraction/layer0": 0.2177,
      "epoch": 1.18,
      "input_norm": 31.99861013412476,
      "input_norm/layer0": 31.99861013412476,
      "learning_rate": 0.005,
      "loss": 2.0067,
      "max_norm": 209.52085876464844,
      "max_norm/layer0": 209.52085876464844,
      "mean_norm": 64.37364196777344,
      "mean_norm/layer0": 64.37364196777344,
      "multicode_k": 1,
      "output_norm": 22.59921900431315,
      "output_norm/layer0": 22.59921900431315,
      "step": 6600
    },
    {
      "MSE": 510.8443921915694,
      "MSE/layer0": 510.8443921915694,
      "dead_code_fraction": 0.21885,
      "dead_code_fraction/layer0": 0.21885,
      "epoch": 1.19,
      "input_norm": 31.998613767623894,
      "input_norm/layer0": 31.998613767623894,
      "learning_rate": 0.005,
      "loss": 2.013,
      "max_norm": 209.98431396484375,
      "max_norm/layer0": 209.98431396484375,
      "mean_norm": 64.46432113647461,
      "mean_norm/layer0": 64.46432113647461,
      "multicode_k": 1,
      "output_norm": 22.60319686889649,
      "output_norm/layer0": 22.60319686889649,
      "step": 6650
    },
    {
      "MSE": 510.0460713704424,
      "MSE/layer0": 510.0460713704424,
      "dead_code_fraction": 0.2183,
      "dead_code_fraction/layer0": 0.2183,
      "epoch": 1.19,
      "input_norm": 31.998641831080132,
      "input_norm/layer0": 31.998641831080132,
      "learning_rate": 0.005,
      "loss": 2.1151,
      "max_norm": 210.53810119628906,
      "max_norm/layer0": 210.53810119628906,
      "mean_norm": 64.55224609375,
      "mean_norm/layer0": 64.55224609375,
      "multicode_k": 1,
      "output_norm": 22.621459808349613,
      "output_norm/layer0": 22.621459808349613,
      "step": 6700
    },
    {
      "MSE": 509.41305414835614,
      "MSE/layer0": 509.41305414835614,
      "dead_code_fraction": 0.2172,
      "dead_code_fraction/layer0": 0.2172,
      "epoch": 1.2,
      "input_norm": 31.998632535934448,
      "input_norm/layer0": 31.998632535934448,
      "learning_rate": 0.005,
      "loss": 2.0318,
      "max_norm": 210.88394165039062,
      "max_norm/layer0": 210.88394165039062,
      "mean_norm": 64.64096069335938,
      "mean_norm/layer0": 64.64096069335938,
      "multicode_k": 1,
      "output_norm": 22.626508464813227,
      "output_norm/layer0": 22.626508464813227,
      "step": 6750
    },
    {
      "MSE": 510.3878801981608,
      "MSE/layer0": 510.3878801981608,
      "dead_code_fraction": 0.21645,
      "dead_code_fraction/layer0": 0.21645,
      "epoch": 1.2,
      "input_norm": 31.998641300201413,
      "input_norm/layer0": 31.998641300201413,
      "learning_rate": 0.005,
      "loss": 2.0492,
      "max_norm": 211.13937377929688,
      "max_norm/layer0": 211.13937377929688,
      "mean_norm": 64.7227783203125,
      "mean_norm/layer0": 64.7227783203125,
      "multicode_k": 1,
      "output_norm": 22.63286488850911,
      "output_norm/layer0": 22.63286488850911,
      "step": 6800
    },
    {
      "MSE": 509.17419825236027,
      "MSE/layer0": 509.17419825236027,
      "dead_code_fraction": 0.2138,
      "dead_code_fraction/layer0": 0.2138,
      "epoch": 1.21,
      "input_norm": 31.998648115793856,
      "input_norm/layer0": 31.998648115793856,
      "learning_rate": 0.005,
      "loss": 2.0467,
      "max_norm": 211.3644256591797,
      "max_norm/layer0": 211.3644256591797,
      "mean_norm": 64.80514907836914,
      "mean_norm/layer0": 64.80514907836914,
      "multicode_k": 1,
      "output_norm": 22.63950007438659,
      "output_norm/layer0": 22.63950007438659,
      "step": 6850
    },
    {
      "MSE": 509.3450110371906,
      "MSE/layer0": 509.3450110371906,
      "dead_code_fraction": 0.2144,
      "dead_code_fraction/layer0": 0.2144,
      "epoch": 1.21,
      "input_norm": 31.998654368718455,
      "input_norm/layer0": 31.998654368718455,
      "learning_rate": 0.005,
      "loss": 2.0327,
      "max_norm": 211.51609802246094,
      "max_norm/layer0": 211.51609802246094,
      "mean_norm": 64.885498046875,
      "mean_norm/layer0": 64.885498046875,
      "multicode_k": 1,
      "output_norm": 22.636532586415615,
      "output_norm/layer0": 22.636532586415615,
      "step": 6900
    },
    {
      "MSE": 509.711417948405,
      "MSE/layer0": 509.711417948405,
      "dead_code_fraction": 0.2121,
      "dead_code_fraction/layer0": 0.2121,
      "epoch": 1.22,
      "input_norm": 31.998653659820555,
      "input_norm/layer0": 31.998653659820555,
      "learning_rate": 0.005,
      "loss": 2.0344,
      "max_norm": 211.93910217285156,
      "max_norm/layer0": 211.93910217285156,
      "mean_norm": 64.96215629577637,
      "mean_norm/layer0": 64.96215629577637,
      "multicode_k": 1,
      "output_norm": 22.642279275258375,
      "output_norm/layer0": 22.642279275258375,
      "step": 6950
    },
    {
      "MSE": 509.53209904988614,
      "MSE/layer0": 509.53209904988614,
      "dead_code_fraction": 0.2112,
      "dead_code_fraction/layer0": 0.2112,
      "epoch": 1.22,
      "input_norm": 31.99865920702616,
      "input_norm/layer0": 31.99865920702616,
      "learning_rate": 0.005,
      "loss": 2.023,
      "max_norm": 212.15188598632812,
      "max_norm/layer0": 212.15188598632812,
      "mean_norm": 65.03938484191895,
      "mean_norm/layer0": 65.03938484191895,
      "multicode_k": 1,
      "output_norm": 22.641168931325275,
      "output_norm/layer0": 22.641168931325275,
      "step": 7000
    },
    {
      "epoch": 1.22,
      "eval_MSE/layer0": 509.9877618207523,
      "eval_accuracy": 0.5156894350128739,
      "eval_dead_code_fraction/layer0": 0.21105,
      "eval_input_norm/layer0": 31.998664335077162,
      "eval_loss": 2.0573580265045166,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 22.65440880063548,
      "eval_runtime": 158.8251,
      "eval_samples_per_second": 29.107,
      "eval_steps_per_second": 1.82,
      "step": 7000
    },
    {
      "MSE": 509.9403240458172,
      "MSE/layer0": 509.9403240458172,
      "dead_code_fraction": 0.2101,
      "dead_code_fraction/layer0": 0.2101,
      "epoch": 1.23,
      "input_norm": 31.998663558959954,
      "input_norm/layer0": 31.998663558959954,
      "learning_rate": 0.005,
      "loss": 2.0391,
      "max_norm": 212.45599365234375,
      "max_norm/layer0": 212.45599365234375,
      "mean_norm": 65.11711883544922,
      "mean_norm/layer0": 65.11711883544922,
      "multicode_k": 1,
      "output_norm": 22.636152718861904,
      "output_norm/layer0": 22.636152718861904,
      "step": 7050
    },
    {
      "MSE": 509.17088083903013,
      "MSE/layer0": 509.17088083903013,
      "dead_code_fraction": 0.2099,
      "dead_code_fraction/layer0": 0.2099,
      "epoch": 1.23,
      "input_norm": 31.998674535751356,
      "input_norm/layer0": 31.998674535751356,
      "learning_rate": 0.005,
      "loss": 2.0413,
      "max_norm": 212.8926544189453,
      "max_norm/layer0": 212.8926544189453,
      "mean_norm": 65.19314002990723,
      "mean_norm/layer0": 65.19314002990723,
      "multicode_k": 1,
      "output_norm": 22.652867739995315,
      "output_norm/layer0": 22.652867739995315,
      "step": 7100
    },
    {
      "MSE": 509.09580220540397,
      "MSE/layer0": 509.09580220540397,
      "dead_code_fraction": 0.209,
      "dead_code_fraction/layer0": 0.209,
      "epoch": 1.24,
      "input_norm": 31.99867464383444,
      "input_norm/layer0": 31.99867464383444,
      "learning_rate": 0.005,
      "loss": 2.0495,
      "max_norm": 213.29238891601562,
      "max_norm/layer0": 213.29238891601562,
      "mean_norm": 65.27325248718262,
      "mean_norm/layer0": 65.27325248718262,
      "multicode_k": 1,
      "output_norm": 22.646062428156533,
      "output_norm/layer0": 22.646062428156533,
      "step": 7150
    },
    {
      "MSE": 509.9214274597167,
      "MSE/layer0": 509.9214274597167,
      "dead_code_fraction": 0.20905,
      "dead_code_fraction/layer0": 0.20905,
      "epoch": 1.24,
      "input_norm": 31.998673133850097,
      "input_norm/layer0": 31.998673133850097,
      "learning_rate": 0.005,
      "loss": 2.0462,
      "max_norm": 213.58729553222656,
      "max_norm/layer0": 213.58729553222656,
      "mean_norm": 65.35407447814941,
      "mean_norm/layer0": 65.35407447814941,
      "multicode_k": 1,
      "output_norm": 22.63937306404113,
      "output_norm/layer0": 22.63937306404113,
      "step": 7200
    },
    {
      "MSE": 508.71533091227207,
      "MSE/layer0": 508.71533091227207,
      "dead_code_fraction": 0.2082,
      "dead_code_fraction/layer0": 0.2082,
      "epoch": 1.25,
      "input_norm": 31.99868763287862,
      "input_norm/layer0": 31.99868763287862,
      "learning_rate": 0.005,
      "loss": 2.0582,
      "max_norm": 213.80873107910156,
      "max_norm/layer0": 213.80873107910156,
      "mean_norm": 65.43496131896973,
      "mean_norm/layer0": 65.43496131896973,
      "multicode_k": 1,
      "output_norm": 22.648734455108645,
      "output_norm/layer0": 22.648734455108645,
      "step": 7250
    },
    {
      "MSE": 507.686293182373,
      "MSE/layer0": 507.686293182373,
      "dead_code_fraction": 0.2066,
      "dead_code_fraction/layer0": 0.2066,
      "epoch": 1.25,
      "input_norm": 31.998690617879234,
      "input_norm/layer0": 31.998690617879234,
      "learning_rate": 0.005,
      "loss": 2.0485,
      "max_norm": 214.17088317871094,
      "max_norm/layer0": 214.17088317871094,
      "mean_norm": 65.51487731933594,
      "mean_norm/layer0": 65.51487731933594,
      "multicode_k": 1,
      "output_norm": 22.669575303395582,
      "output_norm/layer0": 22.669575303395582,
      "step": 7300
    },
    {
      "MSE": 507.97169540405275,
      "MSE/layer0": 507.97169540405275,
      "dead_code_fraction": 0.20445,
      "dead_code_fraction/layer0": 0.20445,
      "epoch": 1.26,
      "input_norm": 31.99869660695392,
      "input_norm/layer0": 31.99869660695392,
      "learning_rate": 0.005,
      "loss": 2.0534,
      "max_norm": 214.52955627441406,
      "max_norm/layer0": 214.52955627441406,
      "mean_norm": 65.59026718139648,
      "mean_norm/layer0": 65.59026718139648,
      "multicode_k": 1,
      "output_norm": 22.678728303909296,
      "output_norm/layer0": 22.678728303909296,
      "step": 7350
    },
    {
      "MSE": 507.6675502522787,
      "MSE/layer0": 507.6675502522787,
      "dead_code_fraction": 0.20485,
      "dead_code_fraction/layer0": 0.20485,
      "epoch": 1.26,
      "input_norm": 31.998699353535965,
      "input_norm/layer0": 31.998699353535965,
      "learning_rate": 0.005,
      "loss": 2.0638,
      "max_norm": 214.7173614501953,
      "max_norm/layer0": 214.7173614501953,
      "mean_norm": 65.67013740539551,
      "mean_norm/layer0": 65.67013740539551,
      "multicode_k": 1,
      "output_norm": 22.67898440043131,
      "output_norm/layer0": 22.67898440043131,
      "step": 7400
    },
    {
      "MSE": 507.85135843912786,
      "MSE/layer0": 507.85135843912786,
      "dead_code_fraction": 0.2049,
      "dead_code_fraction/layer0": 0.2049,
      "epoch": 1.27,
      "input_norm": 31.998699776331584,
      "input_norm/layer0": 31.998699776331584,
      "learning_rate": 0.005,
      "loss": 2.0353,
      "max_norm": 215.19158935546875,
      "max_norm/layer0": 215.19158935546875,
      "mean_norm": 65.75178337097168,
      "mean_norm/layer0": 65.75178337097168,
      "multicode_k": 1,
      "output_norm": 22.680205952326446,
      "output_norm/layer0": 22.680205952326446,
      "step": 7450
    },
    {
      "MSE": 507.253986562093,
      "MSE/layer0": 507.253986562093,
      "dead_code_fraction": 0.20435,
      "dead_code_fraction/layer0": 0.20435,
      "epoch": 1.27,
      "input_norm": 31.99870971679686,
      "input_norm/layer0": 31.99870971679686,
      "learning_rate": 0.005,
      "loss": 2.0791,
      "max_norm": 215.7554931640625,
      "max_norm/layer0": 215.7554931640625,
      "mean_norm": 65.82438659667969,
      "mean_norm/layer0": 65.82438659667969,
      "multicode_k": 1,
      "output_norm": 22.691158383687345,
      "output_norm/layer0": 22.691158383687345,
      "step": 7500
    },
    {
      "epoch": 1.27,
      "eval_MSE/layer0": 507.1513778155122,
      "eval_accuracy": 0.5167855735982843,
      "eval_dead_code_fraction/layer0": 0.2033,
      "eval_input_norm/layer0": 31.998707461867696,
      "eval_loss": 2.0513455867767334,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 22.70183411032355,
      "eval_runtime": 158.8151,
      "eval_samples_per_second": 29.109,
      "eval_steps_per_second": 1.82,
      "step": 7500
    },
    {
      "MSE": 508.0465566507977,
      "MSE/layer0": 508.0465566507977,
      "dead_code_fraction": 0.20265,
      "dead_code_fraction/layer0": 0.20265,
      "epoch": 1.28,
      "input_norm": 31.9987080860138,
      "input_norm/layer0": 31.9987080860138,
      "learning_rate": 0.005,
      "loss": 2.0357,
      "max_norm": 216.1879119873047,
      "max_norm/layer0": 216.1879119873047,
      "mean_norm": 65.89747428894043,
      "mean_norm/layer0": 65.89747428894043,
      "multicode_k": 1,
      "output_norm": 22.691229712168372,
      "output_norm/layer0": 22.691229712168372,
      "step": 7550
    },
    {
      "MSE": 506.86150853474936,
      "MSE/layer0": 506.86150853474936,
      "dead_code_fraction": 0.20235,
      "dead_code_fraction/layer0": 0.20235,
      "epoch": 1.28,
      "input_norm": 31.998724161783855,
      "input_norm/layer0": 31.998724161783855,
      "learning_rate": 0.005,
      "loss": 2.0643,
      "max_norm": 216.84507751464844,
      "max_norm/layer0": 216.84507751464844,
      "mean_norm": 65.96598243713379,
      "mean_norm/layer0": 65.96598243713379,
      "multicode_k": 1,
      "output_norm": 22.70548650105794,
      "output_norm/layer0": 22.70548650105794,
      "step": 7600
    },
    {
      "MSE": 508.52483596801756,
      "MSE/layer0": 508.52483596801756,
      "dead_code_fraction": 0.20115,
      "dead_code_fraction/layer0": 0.20115,
      "epoch": 1.29,
      "input_norm": 31.998720836639407,
      "input_norm/layer0": 31.998720836639407,
      "learning_rate": 0.005,
      "loss": 2.0331,
      "max_norm": 217.07077026367188,
      "max_norm/layer0": 217.07077026367188,
      "mean_norm": 66.04256629943848,
      "mean_norm/layer0": 66.04256629943848,
      "multicode_k": 1,
      "output_norm": 22.671403992970788,
      "output_norm/layer0": 22.671403992970788,
      "step": 7650
    },
    {
      "MSE": 506.7901182556151,
      "MSE/layer0": 506.7901182556151,
      "dead_code_fraction": 0.20025,
      "dead_code_fraction/layer0": 0.20025,
      "epoch": 1.29,
      "input_norm": 31.998723080952953,
      "input_norm/layer0": 31.998723080952953,
      "learning_rate": 0.005,
      "loss": 2.0643,
      "max_norm": 217.60621643066406,
      "max_norm/layer0": 217.60621643066406,
      "mean_norm": 66.1141586303711,
      "mean_norm/layer0": 66.1141586303711,
      "multicode_k": 1,
      "output_norm": 22.711970895131433,
      "output_norm/layer0": 22.711970895131433,
      "step": 7700
    },
    {
      "MSE": 506.4805715942383,
      "MSE/layer0": 506.4805715942383,
      "dead_code_fraction": 0.19955,
      "dead_code_fraction/layer0": 0.19955,
      "epoch": 1.3,
      "input_norm": 31.998739531834943,
      "input_norm/layer0": 31.998739531834943,
      "learning_rate": 0.005,
      "loss": 2.0999,
      "max_norm": 218.18724060058594,
      "max_norm/layer0": 218.18724060058594,
      "mean_norm": 66.18310356140137,
      "mean_norm/layer0": 66.18310356140137,
      "multicode_k": 1,
      "output_norm": 22.715899858474735,
      "output_norm/layer0": 22.715899858474735,
      "step": 7750
    },
    {
      "MSE": 507.79560877482083,
      "MSE/layer0": 507.79560877482083,
      "dead_code_fraction": 0.1983,
      "dead_code_fraction/layer0": 0.1983,
      "epoch": 1.3,
      "input_norm": 31.9987256272634,
      "input_norm/layer0": 31.9987256272634,
      "learning_rate": 0.005,
      "loss": 2.0143,
      "max_norm": 218.3722686767578,
      "max_norm/layer0": 218.3722686767578,
      "mean_norm": 66.25444984436035,
      "mean_norm/layer0": 66.25444984436035,
      "multicode_k": 1,
      "output_norm": 22.692439622879014,
      "output_norm/layer0": 22.692439622879014,
      "step": 7800
    },
    {
      "MSE": 507.2388439432779,
      "MSE/layer0": 507.2388439432779,
      "dead_code_fraction": 0.198,
      "dead_code_fraction/layer0": 0.198,
      "epoch": 1.31,
      "input_norm": 31.998735243479416,
      "input_norm/layer0": 31.998735243479416,
      "learning_rate": 0.005,
      "loss": 2.069,
      "max_norm": 218.93580627441406,
      "max_norm/layer0": 218.93580627441406,
      "mean_norm": 66.32441329956055,
      "mean_norm/layer0": 66.32441329956055,
      "multicode_k": 1,
      "output_norm": 22.703038584391276,
      "output_norm/layer0": 22.703038584391276,
      "step": 7850
    },
    {
      "MSE": 508.13961395263664,
      "MSE/layer0": 508.13961395263664,
      "dead_code_fraction": 0.19705,
      "dead_code_fraction/layer0": 0.19705,
      "epoch": 1.31,
      "input_norm": 31.99873922983806,
      "input_norm/layer0": 31.99873922983806,
      "learning_rate": 0.005,
      "loss": 2.0712,
      "max_norm": 219.51759338378906,
      "max_norm/layer0": 219.51759338378906,
      "mean_norm": 66.39589881896973,
      "mean_norm/layer0": 66.39589881896973,
      "multicode_k": 1,
      "output_norm": 22.68491499900817,
      "output_norm/layer0": 22.68491499900817,
      "step": 7900
    },
    {
      "MSE": 506.5046355692546,
      "MSE/layer0": 506.5046355692546,
      "dead_code_fraction": 0.1958,
      "dead_code_fraction/layer0": 0.1958,
      "epoch": 1.32,
      "input_norm": 31.998745075861606,
      "input_norm/layer0": 31.998745075861606,
      "learning_rate": 0.005,
      "loss": 2.0623,
      "max_norm": 220.1356658935547,
      "max_norm/layer0": 220.1356658935547,
      "mean_norm": 66.46616172790527,
      "mean_norm/layer0": 66.46616172790527,
      "multicode_k": 1,
      "output_norm": 22.709094810485844,
      "output_norm/layer0": 22.709094810485844,
      "step": 7950
    },
    {
      "MSE": 506.24584472656227,
      "MSE/layer0": 506.24584472656227,
      "dead_code_fraction": 0.1962,
      "dead_code_fraction/layer0": 0.1962,
      "epoch": 1.32,
      "input_norm": 31.998744071324662,
      "input_norm/layer0": 31.998744071324662,
      "learning_rate": 0.005,
      "loss": 2.0252,
      "max_norm": 220.52029418945312,
      "max_norm/layer0": 220.52029418945312,
      "mean_norm": 66.54170417785645,
      "mean_norm/layer0": 66.54170417785645,
      "multicode_k": 1,
      "output_norm": 22.71004734039306,
      "output_norm/layer0": 22.71004734039306,
      "step": 8000
    },
    {
      "epoch": 1.32,
      "eval_MSE/layer0": 505.2722684186489,
      "eval_accuracy": 0.5173414664109856,
      "eval_dead_code_fraction/layer0": 0.19525,
      "eval_input_norm/layer0": 31.998757950702117,
      "eval_loss": 2.046276569366455,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 22.71078164304668,
      "eval_runtime": 158.1298,
      "eval_samples_per_second": 29.235,
      "eval_steps_per_second": 1.828,
      "step": 8000
    },
    {
      "MSE": 507.15304565429676,
      "MSE/layer0": 507.15304565429676,
      "dead_code_fraction": 0.1941,
      "dead_code_fraction/layer0": 0.1941,
      "epoch": 1.33,
      "input_norm": 31.998751821517956,
      "input_norm/layer0": 31.998751821517956,
      "learning_rate": 0.005,
      "loss": 2.0231,
      "max_norm": 221.12425231933594,
      "max_norm/layer0": 221.12425231933594,
      "mean_norm": 66.61260223388672,
      "mean_norm/layer0": 66.61260223388672,
      "multicode_k": 1,
      "output_norm": 22.70729770024618,
      "output_norm/layer0": 22.70729770024618,
      "step": 8050
    },
    {
      "MSE": 508.0300794474282,
      "MSE/layer0": 508.0300794474282,
      "dead_code_fraction": 0.19355,
      "dead_code_fraction/layer0": 0.19355,
      "epoch": 1.33,
      "input_norm": 31.998755750656134,
      "input_norm/layer0": 31.998755750656134,
      "learning_rate": 0.005,
      "loss": 2.0065,
      "max_norm": 221.41090393066406,
      "max_norm/layer0": 221.41090393066406,
      "mean_norm": 66.68024253845215,
      "mean_norm/layer0": 66.68024253845215,
      "multicode_k": 1,
      "output_norm": 22.685567102432238,
      "output_norm/layer0": 22.685567102432238,
      "step": 8100
    },
    {
      "MSE": 506.83792968750004,
      "MSE/layer0": 506.83792968750004,
      "dead_code_fraction": 0.194,
      "dead_code_fraction/layer0": 0.194,
      "epoch": 1.34,
      "input_norm": 31.998766530354814,
      "input_norm/layer0": 31.998766530354814,
      "learning_rate": 0.005,
      "loss": 2.0545,
      "max_norm": 221.77352905273438,
      "max_norm/layer0": 221.77352905273438,
      "mean_norm": 66.74850654602051,
      "mean_norm/layer0": 66.74850654602051,
      "multicode_k": 1,
      "output_norm": 22.711014649073284,
      "output_norm/layer0": 22.711014649073284,
      "step": 8150
    },
    {
      "MSE": 506.1638347880046,
      "MSE/layer0": 506.1638347880046,
      "dead_code_fraction": 0.1922,
      "dead_code_fraction/layer0": 0.1922,
      "epoch": 1.34,
      "input_norm": 31.998765303293865,
      "input_norm/layer0": 31.998765303293865,
      "learning_rate": 0.005,
      "loss": 2.0291,
      "max_norm": 222.23851013183594,
      "max_norm/layer0": 222.23851013183594,
      "mean_norm": 66.81972694396973,
      "mean_norm/layer0": 66.81972694396973,
      "multicode_k": 1,
      "output_norm": 22.712359495162957,
      "output_norm/layer0": 22.712359495162957,
      "step": 8200
    },
    {
      "MSE": 505.4201058959959,
      "MSE/layer0": 505.4201058959959,
      "dead_code_fraction": 0.19165,
      "dead_code_fraction/layer0": 0.19165,
      "epoch": 1.35,
      "input_norm": 31.998765595753984,
      "input_norm/layer0": 31.998765595753984,
      "learning_rate": 0.005,
      "loss": 2.0255,
      "max_norm": 222.60708618164062,
      "max_norm/layer0": 222.60708618164062,
      "mean_norm": 66.89296340942383,
      "mean_norm/layer0": 66.89296340942383,
      "multicode_k": 1,
      "output_norm": 22.733057559331257,
      "output_norm/layer0": 22.733057559331257,
      "step": 8250
    },
    {
      "MSE": 506.6631129964193,
      "MSE/layer0": 506.6631129964193,
      "dead_code_fraction": 0.18985,
      "dead_code_fraction/layer0": 0.18985,
      "epoch": 1.35,
      "input_norm": 31.998774194717406,
      "input_norm/layer0": 31.998774194717406,
      "learning_rate": 0.005,
      "loss": 2.0543,
      "max_norm": 222.95948791503906,
      "max_norm/layer0": 222.95948791503906,
      "mean_norm": 66.95783233642578,
      "mean_norm/layer0": 66.95783233642578,
      "multicode_k": 1,
      "output_norm": 22.715471951166787,
      "output_norm/layer0": 22.715471951166787,
      "step": 8300
    },
    {
      "MSE": 505.8098661804198,
      "MSE/layer0": 505.8098661804198,
      "dead_code_fraction": 0.1901,
      "dead_code_fraction/layer0": 0.1901,
      "epoch": 1.36,
      "input_norm": 31.998776054382326,
      "input_norm/layer0": 31.998776054382326,
      "learning_rate": 0.005,
      "loss": 2.0361,
      "max_norm": 222.99290466308594,
      "max_norm/layer0": 222.99290466308594,
      "mean_norm": 67.03095436096191,
      "mean_norm/layer0": 67.03095436096191,
      "multicode_k": 1,
      "output_norm": 22.720023854573576,
      "output_norm/layer0": 22.720023854573576,
      "step": 8350
    },
    {
      "MSE": 504.6476872253421,
      "MSE/layer0": 504.6476872253421,
      "dead_code_fraction": 0.18865,
      "dead_code_fraction/layer0": 0.18865,
      "epoch": 1.36,
      "input_norm": 31.99877415021262,
      "input_norm/layer0": 31.99877415021262,
      "learning_rate": 0.005,
      "loss": 2.018,
      "max_norm": 222.99652099609375,
      "max_norm/layer0": 222.99652099609375,
      "mean_norm": 67.10310173034668,
      "mean_norm/layer0": 67.10310173034668,
      "multicode_k": 1,
      "output_norm": 22.743260552088422,
      "output_norm/layer0": 22.743260552088422,
      "step": 8400
    },
    {
      "MSE": 505.1742755126953,
      "MSE/layer0": 505.1742755126953,
      "dead_code_fraction": 0.18805,
      "dead_code_fraction/layer0": 0.18805,
      "epoch": 1.37,
      "input_norm": 31.998781833648685,
      "input_norm/layer0": 31.998781833648685,
      "learning_rate": 0.005,
      "loss": 2.0373,
      "max_norm": 223.39710998535156,
      "max_norm/layer0": 223.39710998535156,
      "mean_norm": 67.17368698120117,
      "mean_norm/layer0": 67.17368698120117,
      "multicode_k": 1,
      "output_norm": 22.74353121121724,
      "output_norm/layer0": 22.74353121121724,
      "step": 8450
    },
    {
      "MSE": 505.00153442382805,
      "MSE/layer0": 505.00153442382805,
      "dead_code_fraction": 0.1875,
      "dead_code_fraction/layer0": 0.1875,
      "epoch": 1.37,
      "input_norm": 31.998789456685383,
      "input_norm/layer0": 31.998789456685383,
      "learning_rate": 0.005,
      "loss": 2.0432,
      "max_norm": 223.86239624023438,
      "max_norm/layer0": 223.86239624023438,
      "mean_norm": 67.2455825805664,
      "mean_norm/layer0": 67.2455825805664,
      "multicode_k": 1,
      "output_norm": 22.747594401041667,
      "output_norm/layer0": 22.747594401041667,
      "step": 8500
    },
    {
      "epoch": 1.37,
      "eval_MSE/layer0": 502.9394664067146,
      "eval_accuracy": 0.5183496432580605,
      "eval_dead_code_fraction/layer0": 0.18745,
      "eval_input_norm/layer0": 31.998788164622738,
      "eval_loss": 2.042330265045166,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 22.756197618711013,
      "eval_runtime": 159.3738,
      "eval_samples_per_second": 29.007,
      "eval_steps_per_second": 1.813,
      "step": 8500
    },
    {
      "MSE": 504.47000788370775,
      "MSE/layer0": 504.47000788370775,
      "dead_code_fraction": 0.1867,
      "dead_code_fraction/layer0": 0.1867,
      "epoch": 1.38,
      "input_norm": 31.998792708714795,
      "input_norm/layer0": 31.998792708714795,
      "learning_rate": 0.005,
      "loss": 2.0483,
      "max_norm": 224.50177001953125,
      "max_norm/layer0": 224.50177001953125,
      "mean_norm": 67.31682586669922,
      "mean_norm/layer0": 67.31682586669922,
      "multicode_k": 1,
      "output_norm": 22.753840500513725,
      "output_norm/layer0": 22.753840500513725,
      "step": 8550
    },
    {
      "MSE": 504.7471296691896,
      "MSE/layer0": 504.7471296691896,
      "dead_code_fraction": 0.1861,
      "dead_code_fraction/layer0": 0.1861,
      "epoch": 1.38,
      "input_norm": 31.99879879315695,
      "input_norm/layer0": 31.99879879315695,
      "learning_rate": 0.005,
      "loss": 2.0626,
      "max_norm": 224.77008056640625,
      "max_norm/layer0": 224.77008056640625,
      "mean_norm": 67.38501358032227,
      "mean_norm/layer0": 67.38501358032227,
      "multicode_k": 1,
      "output_norm": 22.75965905507406,
      "output_norm/layer0": 22.75965905507406,
      "step": 8600
    },
    {
      "MSE": 504.43309575398786,
      "MSE/layer0": 504.43309575398786,
      "dead_code_fraction": 0.18575,
      "dead_code_fraction/layer0": 0.18575,
      "epoch": 1.39,
      "input_norm": 31.9987975247701,
      "input_norm/layer0": 31.9987975247701,
      "learning_rate": 0.005,
      "loss": 2.0528,
      "max_norm": 224.8895263671875,
      "max_norm/layer0": 224.8895263671875,
      "mean_norm": 67.45294189453125,
      "mean_norm/layer0": 67.45294189453125,
      "multicode_k": 1,
      "output_norm": 22.765578152338662,
      "output_norm/layer0": 22.765578152338662,
      "step": 8650
    },
    {
      "MSE": 504.8997240193688,
      "MSE/layer0": 504.8997240193688,
      "dead_code_fraction": 0.1849,
      "dead_code_fraction/layer0": 0.1849,
      "epoch": 1.39,
      "input_norm": 31.998805205027267,
      "input_norm/layer0": 31.998805205027267,
      "learning_rate": 0.005,
      "loss": 2.0355,
      "max_norm": 225.1109619140625,
      "max_norm/layer0": 225.1109619140625,
      "mean_norm": 67.51644897460938,
      "mean_norm/layer0": 67.51644897460938,
      "multicode_k": 1,
      "output_norm": 22.76556049982706,
      "output_norm/layer0": 22.76556049982706,
      "step": 8700
    },
    {
      "MSE": 504.98007812499975,
      "MSE/layer0": 504.98007812499975,
      "dead_code_fraction": 0.1841,
      "dead_code_fraction/layer0": 0.1841,
      "epoch": 1.4,
      "input_norm": 31.998811095555627,
      "input_norm/layer0": 31.998811095555627,
      "learning_rate": 0.005,
      "loss": 2.048,
      "max_norm": 225.3004608154297,
      "max_norm/layer0": 225.3004608154297,
      "mean_norm": 67.58170700073242,
      "mean_norm/layer0": 67.58170700073242,
      "multicode_k": 1,
      "output_norm": 22.734453417460124,
      "output_norm/layer0": 22.734453417460124,
      "step": 8750
    },
    {
      "MSE": 505.8172926839193,
      "MSE/layer0": 505.8172926839193,
      "dead_code_fraction": 0.1825,
      "dead_code_fraction/layer0": 0.1825,
      "epoch": 1.4,
      "input_norm": 31.998811902999876,
      "input_norm/layer0": 31.998811902999876,
      "learning_rate": 0.005,
      "loss": 2.0314,
      "max_norm": 225.43496704101562,
      "max_norm/layer0": 225.43496704101562,
      "mean_norm": 67.64213943481445,
      "mean_norm/layer0": 67.64213943481445,
      "multicode_k": 1,
      "output_norm": 22.746523040135706,
      "output_norm/layer0": 22.746523040135706,
      "step": 8800
    },
    {
      "MSE": 505.15463668823276,
      "MSE/layer0": 505.15463668823276,
      "dead_code_fraction": 0.1834,
      "dead_code_fraction/layer0": 0.1834,
      "epoch": 1.41,
      "input_norm": 31.99881089528401,
      "input_norm/layer0": 31.99881089528401,
      "learning_rate": 0.005,
      "loss": 2.0019,
      "max_norm": 225.2454376220703,
      "max_norm/layer0": 225.2454376220703,
      "mean_norm": 67.70701217651367,
      "mean_norm/layer0": 67.70701217651367,
      "multicode_k": 1,
      "output_norm": 22.74102473258972,
      "output_norm/layer0": 22.74102473258972,
      "step": 8850
    },
    {
      "MSE": 505.15305394490576,
      "MSE/layer0": 505.15305394490576,
      "dead_code_fraction": 0.18105,
      "dead_code_fraction/layer0": 0.18105,
      "epoch": 1.41,
      "input_norm": 31.99882117907206,
      "input_norm/layer0": 31.99882117907206,
      "learning_rate": 0.005,
      "loss": 2.0614,
      "max_norm": 224.98548889160156,
      "max_norm/layer0": 224.98548889160156,
      "mean_norm": 67.77053833007812,
      "mean_norm/layer0": 67.77053833007812,
      "multicode_k": 1,
      "output_norm": 22.750008074442544,
      "output_norm/layer0": 22.750008074442544,
      "step": 8900
    },
    {
      "MSE": 505.46065561930345,
      "MSE/layer0": 505.46065561930345,
      "dead_code_fraction": 0.1809,
      "dead_code_fraction/layer0": 0.1809,
      "epoch": 1.42,
      "input_norm": 31.99882030487061,
      "input_norm/layer0": 31.99882030487061,
      "learning_rate": 0.005,
      "loss": 2.0259,
      "max_norm": 224.90966796875,
      "max_norm/layer0": 224.90966796875,
      "mean_norm": 67.83388900756836,
      "mean_norm/layer0": 67.83388900756836,
      "multicode_k": 1,
      "output_norm": 22.744747044245393,
      "output_norm/layer0": 22.744747044245393,
      "step": 8950
    },
    {
      "MSE": 503.93126592000317,
      "MSE/layer0": 503.93126592000317,
      "dead_code_fraction": 0.1795,
      "dead_code_fraction/layer0": 0.1795,
      "epoch": 1.42,
      "input_norm": 31.99882487614949,
      "input_norm/layer0": 31.99882487614949,
      "learning_rate": 0.005,
      "loss": 2.0549,
      "max_norm": 224.75604248046875,
      "max_norm/layer0": 224.75604248046875,
      "mean_norm": 67.89757537841797,
      "mean_norm/layer0": 67.89757537841797,
      "multicode_k": 1,
      "output_norm": 22.767707106272383,
      "output_norm/layer0": 22.767707106272383,
      "step": 9000
    },
    {
      "epoch": 1.42,
      "eval_MSE/layer0": 502.90162357014304,
      "eval_accuracy": 0.518752237368134,
      "eval_dead_code_fraction/layer0": 0.1797,
      "eval_input_norm/layer0": 31.998819289515865,
      "eval_loss": 2.0394132137298584,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 22.772194602647794,
      "eval_runtime": 158.4408,
      "eval_samples_per_second": 29.178,
      "eval_steps_per_second": 1.824,
      "step": 9000
    },
    {
      "MSE": 504.23655522664376,
      "MSE/layer0": 504.23655522664376,
      "dead_code_fraction": 0.17875,
      "dead_code_fraction/layer0": 0.17875,
      "epoch": 1.43,
      "input_norm": 31.998824621836345,
      "input_norm/layer0": 31.998824621836345,
      "learning_rate": 0.005,
      "loss": 2.0392,
      "max_norm": 224.60926818847656,
      "max_norm/layer0": 224.60926818847656,
      "mean_norm": 67.96440505981445,
      "mean_norm/layer0": 67.96440505981445,
      "multicode_k": 1,
      "output_norm": 22.772467877070113,
      "output_norm/layer0": 22.772467877070113,
      "step": 9050
    },
    {
      "MSE": 503.93936604817725,
      "MSE/layer0": 503.93936604817725,
      "dead_code_fraction": 0.17785,
      "dead_code_fraction/layer0": 0.17785,
      "epoch": 1.43,
      "input_norm": 31.99882525444032,
      "input_norm/layer0": 31.99882525444032,
      "learning_rate": 0.005,
      "loss": 2.0329,
      "max_norm": 224.35545349121094,
      "max_norm/layer0": 224.35545349121094,
      "mean_norm": 68.02788925170898,
      "mean_norm/layer0": 68.02788925170898,
      "multicode_k": 1,
      "output_norm": 22.77433245976766,
      "output_norm/layer0": 22.77433245976766,
      "step": 9100
    },
    {
      "MSE": 504.38566899617547,
      "MSE/layer0": 504.38566899617547,
      "dead_code_fraction": 0.1771,
      "dead_code_fraction/layer0": 0.1771,
      "epoch": 1.44,
      "input_norm": 31.998831052780154,
      "input_norm/layer0": 31.998831052780154,
      "learning_rate": 0.005,
      "loss": 2.0175,
      "max_norm": 224.176025390625,
      "max_norm/layer0": 224.176025390625,
      "mean_norm": 68.09515762329102,
      "mean_norm/layer0": 68.09515762329102,
      "multicode_k": 1,
      "output_norm": 22.758301575978592,
      "output_norm/layer0": 22.758301575978592,
      "step": 9150
    },
    {
      "MSE": 503.9738773091634,
      "MSE/layer0": 503.9738773091634,
      "dead_code_fraction": 0.1763,
      "dead_code_fraction/layer0": 0.1763,
      "epoch": 1.44,
      "input_norm": 31.998839066823308,
      "input_norm/layer0": 31.998839066823308,
      "learning_rate": 0.005,
      "loss": 2.0462,
      "max_norm": 224.0868377685547,
      "max_norm/layer0": 224.0868377685547,
      "mean_norm": 68.16043853759766,
      "mean_norm/layer0": 68.16043853759766,
      "multicode_k": 1,
      "output_norm": 22.7744267431895,
      "output_norm/layer0": 22.7744267431895,
      "step": 9200
    },
    {
      "MSE": 503.29069310506196,
      "MSE/layer0": 503.29069310506196,
      "dead_code_fraction": 0.17485,
      "dead_code_fraction/layer0": 0.17485,
      "epoch": 1.45,
      "input_norm": 31.99883868853251,
      "input_norm/layer0": 31.99883868853251,
      "learning_rate": 0.005,
      "loss": 2.0416,
      "max_norm": 223.89230346679688,
      "max_norm/layer0": 223.89230346679688,
      "mean_norm": 68.22885513305664,
      "mean_norm/layer0": 68.22885513305664,
      "multicode_k": 1,
      "output_norm": 22.78441795984904,
      "output_norm/layer0": 22.78441795984904,
      "step": 9250
    },
    {
      "MSE": 504.4634376017252,
      "MSE/layer0": 504.4634376017252,
      "dead_code_fraction": 0.17465,
      "dead_code_fraction/layer0": 0.17465,
      "epoch": 1.45,
      "input_norm": 31.998847064971933,
      "input_norm/layer0": 31.998847064971933,
      "learning_rate": 0.005,
      "loss": 2.0822,
      "max_norm": 223.5952911376953,
      "max_norm/layer0": 223.5952911376953,
      "mean_norm": 68.2917366027832,
      "mean_norm/layer0": 68.2917366027832,
      "multicode_k": 1,
      "output_norm": 22.78019981384277,
      "output_norm/layer0": 22.78019981384277,
      "step": 9300
    },
    {
      "MSE": 504.5819336954755,
      "MSE/layer0": 504.5819336954755,
      "dead_code_fraction": 0.1737,
      "dead_code_fraction/layer0": 0.1737,
      "epoch": 1.46,
      "input_norm": 31.998844486872358,
      "input_norm/layer0": 31.998844486872358,
      "learning_rate": 0.005,
      "loss": 2.0181,
      "max_norm": 223.33349609375,
      "max_norm/layer0": 223.33349609375,
      "mean_norm": 68.3541030883789,
      "mean_norm/layer0": 68.3541030883789,
      "multicode_k": 1,
      "output_norm": 22.770421886444097,
      "output_norm/layer0": 22.770421886444097,
      "step": 9350
    },
    {
      "MSE": 504.08388671875014,
      "MSE/layer0": 504.08388671875014,
      "dead_code_fraction": 0.17315,
      "dead_code_fraction/layer0": 0.17315,
      "epoch": 1.46,
      "input_norm": 31.998852834701534,
      "input_norm/layer0": 31.998852834701534,
      "learning_rate": 0.005,
      "loss": 2.0332,
      "max_norm": 223.0471954345703,
      "max_norm/layer0": 223.0471954345703,
      "mean_norm": 68.41642379760742,
      "mean_norm/layer0": 68.41642379760742,
      "multicode_k": 1,
      "output_norm": 22.783455673853553,
      "output_norm/layer0": 22.783455673853553,
      "step": 9400
    },
    {
      "MSE": 504.4143726603196,
      "MSE/layer0": 504.4143726603196,
      "dead_code_fraction": 0.17145,
      "dead_code_fraction/layer0": 0.17145,
      "epoch": 1.47,
      "input_norm": 31.998856865564967,
      "input_norm/layer0": 31.998856865564967,
      "learning_rate": 0.005,
      "loss": 2.0241,
      "max_norm": 222.83218383789062,
      "max_norm/layer0": 222.83218383789062,
      "mean_norm": 68.48007202148438,
      "mean_norm/layer0": 68.48007202148438,
      "multicode_k": 1,
      "output_norm": 22.767489954630527,
      "output_norm/layer0": 22.767489954630527,
      "step": 9450
    },
    {
      "MSE": 503.2655168151856,
      "MSE/layer0": 503.2655168151856,
      "dead_code_fraction": 0.17245,
      "dead_code_fraction/layer0": 0.17245,
      "epoch": 1.47,
      "input_norm": 31.998857196172086,
      "input_norm/layer0": 31.998857196172086,
      "learning_rate": 0.005,
      "loss": 2.0087,
      "max_norm": 222.5254669189453,
      "max_norm/layer0": 222.5254669189453,
      "mean_norm": 68.54964065551758,
      "mean_norm/layer0": 68.54964065551758,
      "multicode_k": 1,
      "output_norm": 22.78383262634278,
      "output_norm/layer0": 22.78383262634278,
      "step": 9500
    },
    {
      "epoch": 1.47,
      "eval_MSE/layer0": 504.0087830256569,
      "eval_accuracy": 0.5192516739689711,
      "eval_dead_code_fraction/layer0": 0.1704,
      "eval_input_norm/layer0": 31.99886018302103,
      "eval_loss": 2.0364596843719482,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 22.799023320451585,
      "eval_runtime": 158.3046,
      "eval_samples_per_second": 29.203,
      "eval_steps_per_second": 1.826,
      "step": 9500
    },
    {
      "MSE": 502.63093187018274,
      "MSE/layer0": 502.63093187018274,
      "dead_code_fraction": 0.1713,
      "dead_code_fraction/layer0": 0.1713,
      "epoch": 1.48,
      "input_norm": 31.998863240132852,
      "input_norm/layer0": 31.998863240132852,
      "learning_rate": 0.005,
      "loss": 2.0083,
      "max_norm": 222.2374725341797,
      "max_norm/layer0": 222.2374725341797,
      "mean_norm": 68.61249160766602,
      "mean_norm/layer0": 68.61249160766602,
      "multicode_k": 1,
      "output_norm": 22.79880291995348,
      "output_norm/layer0": 22.79880291995348,
      "step": 9550
    },
    {
      "MSE": 505.36792836568793,
      "MSE/layer0": 505.36792836568793,
      "dead_code_fraction": 0.17135,
      "dead_code_fraction/layer0": 0.17135,
      "epoch": 2.0,
      "input_norm": 31.99885930271917,
      "input_norm/layer0": 31.99885930271917,
      "learning_rate": 0.005,
      "loss": 2.0034,
      "max_norm": 222.0310516357422,
      "max_norm/layer0": 222.0310516357422,
      "mean_norm": 68.67721176147461,
      "mean_norm/layer0": 68.67721176147461,
      "multicode_k": 1,
      "output_norm": 22.74409036474983,
      "output_norm/layer0": 22.74409036474983,
      "step": 9600
    },
    {
      "MSE": 502.98986485799134,
      "MSE/layer0": 502.98986485799134,
      "dead_code_fraction": 0.1697,
      "dead_code_fraction/layer0": 0.1697,
      "epoch": 2.01,
      "input_norm": 31.998873513539642,
      "input_norm/layer0": 31.998873513539642,
      "learning_rate": 0.005,
      "loss": 2.072,
      "max_norm": 222.00772094726562,
      "max_norm/layer0": 222.00772094726562,
      "mean_norm": 68.73538589477539,
      "mean_norm/layer0": 68.73538589477539,
      "multicode_k": 1,
      "output_norm": 22.796976168950394,
      "output_norm/layer0": 22.796976168950394,
      "step": 9650
    },
    {
      "MSE": 503.04733729044574,
      "MSE/layer0": 503.04733729044574,
      "dead_code_fraction": 0.16915,
      "dead_code_fraction/layer0": 0.16915,
      "epoch": 2.01,
      "input_norm": 31.998862508138025,
      "input_norm/layer0": 31.998862508138025,
      "learning_rate": 0.005,
      "loss": 1.9691,
      "max_norm": 221.80978393554688,
      "max_norm/layer0": 221.80978393554688,
      "mean_norm": 68.80109405517578,
      "mean_norm/layer0": 68.80109405517578,
      "multicode_k": 1,
      "output_norm": 22.794911410013835,
      "output_norm/layer0": 22.794911410013835,
      "step": 9700
    },
    {
      "MSE": 503.3161979675292,
      "MSE/layer0": 503.3161979675292,
      "dead_code_fraction": 0.16895,
      "dead_code_fraction/layer0": 0.16895,
      "epoch": 2.02,
      "input_norm": 31.998878345489487,
      "input_norm/layer0": 31.998878345489487,
      "learning_rate": 0.005,
      "loss": 2.0368,
      "max_norm": 221.684814453125,
      "max_norm/layer0": 221.684814453125,
      "mean_norm": 68.86429214477539,
      "mean_norm/layer0": 68.86429214477539,
      "multicode_k": 1,
      "output_norm": 22.785858039855956,
      "output_norm/layer0": 22.785858039855956,
      "step": 9750
    },
    {
      "MSE": 502.7885366821291,
      "MSE/layer0": 502.7885366821291,
      "dead_code_fraction": 0.16775,
      "dead_code_fraction/layer0": 0.16775,
      "epoch": 2.02,
      "input_norm": 31.998876323699957,
      "input_norm/layer0": 31.998876323699957,
      "learning_rate": 0.005,
      "loss": 2.0029,
      "max_norm": 221.55738830566406,
      "max_norm/layer0": 221.55738830566406,
      "mean_norm": 68.92353439331055,
      "mean_norm/layer0": 68.92353439331055,
      "multicode_k": 1,
      "output_norm": 22.80311137835186,
      "output_norm/layer0": 22.80311137835186,
      "step": 9800
    },
    {
      "MSE": 503.08141484578465,
      "MSE/layer0": 503.08141484578465,
      "dead_code_fraction": 0.16675,
      "dead_code_fraction/layer0": 0.16675,
      "epoch": 2.03,
      "input_norm": 31.998882681528727,
      "input_norm/layer0": 31.998882681528727,
      "learning_rate": 0.005,
      "loss": 2.0058,
      "max_norm": 221.4176025390625,
      "max_norm/layer0": 221.4176025390625,
      "mean_norm": 68.97920608520508,
      "mean_norm/layer0": 68.97920608520508,
      "multicode_k": 1,
      "output_norm": 22.79436633110047,
      "output_norm/layer0": 22.79436633110047,
      "step": 9850
    },
    {
      "MSE": 503.44391169230175,
      "MSE/layer0": 503.44391169230175,
      "dead_code_fraction": 0.16635,
      "dead_code_fraction/layer0": 0.16635,
      "epoch": 2.03,
      "input_norm": 31.998889300028488,
      "input_norm/layer0": 31.998889300028488,
      "learning_rate": 0.005,
      "loss": 2.0128,
      "max_norm": 220.8733673095703,
      "max_norm/layer0": 220.8733673095703,
      "mean_norm": 69.03522872924805,
      "mean_norm/layer0": 69.03522872924805,
      "multicode_k": 1,
      "output_norm": 22.793825833002728,
      "output_norm/layer0": 22.793825833002728,
      "step": 9900
    },
    {
      "MSE": 503.14160481770807,
      "MSE/layer0": 503.14160481770807,
      "dead_code_fraction": 0.1655,
      "dead_code_fraction/layer0": 0.1655,
      "epoch": 2.04,
      "input_norm": 31.99888905207317,
      "input_norm/layer0": 31.99888905207317,
      "learning_rate": 0.005,
      "loss": 2.0053,
      "max_norm": 220.66598510742188,
      "max_norm/layer0": 220.66598510742188,
      "mean_norm": 69.08990859985352,
      "mean_norm/layer0": 69.08990859985352,
      "multicode_k": 1,
      "output_norm": 22.802439581553138,
      "output_norm/layer0": 22.802439581553138,
      "step": 9950
    },
    {
      "MSE": 502.7584656778976,
      "MSE/layer0": 502.7584656778976,
      "dead_code_fraction": 0.16445,
      "dead_code_fraction/layer0": 0.16445,
      "epoch": 2.04,
      "input_norm": 31.998899453481037,
      "input_norm/layer0": 31.998899453481037,
      "learning_rate": 0.005,
      "loss": 2.0569,
      "max_norm": 220.5869903564453,
      "max_norm/layer0": 220.5869903564453,
      "mean_norm": 69.14492416381836,
      "mean_norm/layer0": 69.14492416381836,
      "multicode_k": 1,
      "output_norm": 22.808293444315584,
      "output_norm/layer0": 22.808293444315584,
      "step": 10000
    },
    {
      "epoch": 2.04,
      "eval_MSE/layer0": 501.8128262733759,
      "eval_accuracy": 0.5193506309245984,
      "eval_dead_code_fraction/layer0": 0.16395,
      "eval_input_norm/layer0": 31.998895487949337,
      "eval_loss": 2.0353407859802246,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 22.80092038433711,
      "eval_runtime": 158.6027,
      "eval_samples_per_second": 29.148,
      "eval_steps_per_second": 1.822,
      "step": 10000
    },
    {
      "MSE": 0.0,
      "MSE/layer0": 0.0,
      "dead_code_fraction": 1.0,
      "dead_code_fraction/layer0": 1.0,
      "epoch": 2.04,
      "input_norm": 0.0,
      "input_norm/layer0": 0.0,
      "max_norm": 220.5869903564453,
      "max_norm/layer0": 220.5869903564453,
      "mean_norm": 69.14492416381836,
      "mean_norm/layer0": 69.14492416381836,
      "multicode_k": 1,
      "output_norm": 0.0,
      "output_norm/layer0": 0.0,
      "step": 10000,
      "total_flos": 7.43098011353088e+16,
      "train_loss": 2.205516522693634,
      "train_runtime": 15654.0479,
      "train_samples_per_second": 61.326,
      "train_steps_per_second": 0.639
    }
  ],
  "logging_steps": 50,
  "max_steps": 10000,
  "num_train_epochs": 9223372036854775807,
  "save_steps": 500,
  "total_flos": 7.43098011353088e+16,
  "trial_name": null,
  "trial_params": null
}