{
  "best_metric": 1.89570152759552,
  "best_model_checkpoint": "/tmp/wandb/run-20240207_044253-56k3p8kp/files/train_output/checkpoint-10000",
  "epoch": 1.044022968505307,
  "eval_steps": 500,
  "global_step": 10000,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "MSE": 872.5187733968098,
      "MSE/layer0": 872.5187733968098,
      "dead_code_fraction": 0.0276,
      "dead_code_fraction/layer0": 0.0276,
      "epoch": 0.0,
      "input_norm": 31.997111479441326,
      "input_norm/layer0": 31.997111479441326,
      "learning_rate": 1e-06,
      "loss": 9.0051,
      "max_norm": 34.71393966674805,
      "max_norm/layer0": 34.71393966674805,
      "mean_norm": 31.98521327972412,
      "mean_norm/layer0": 31.98521327972412,
      "multicode_k": 1,
      "output_norm": 4.134780248006185,
      "output_norm/layer0": 4.134780248006185,
      "step": 1
    },
    {
      "MSE": 871.4381560241286,
      "MSE/layer0": 871.4381560241286,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.01,
      "input_norm": 31.99644809839677,
      "input_norm/layer0": 31.99644809839677,
      "learning_rate": 5e-05,
      "loss": 7.0703,
      "max_norm": 34.72187423706055,
      "max_norm/layer0": 34.72187423706055,
      "mean_norm": 31.991936683654785,
      "mean_norm/layer0": 31.991936683654785,
      "multicode_k": 1,
      "output_norm": 4.145846879401173,
      "output_norm/layer0": 4.145846879401173,
      "step": 50
    },
    {
      "MSE": 868.4475470987957,
      "MSE/layer0": 868.4475470987957,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.01,
      "input_norm": 31.995786774953213,
      "input_norm/layer0": 31.995786774953213,
      "learning_rate": 0.0001,
      "loss": 4.1515,
      "max_norm": 34.748802185058594,
      "max_norm/layer0": 34.748802185058594,
      "mean_norm": 32.0172176361084,
      "mean_norm/layer0": 32.0172176361084,
      "multicode_k": 1,
      "output_norm": 4.178660261631009,
      "output_norm/layer0": 4.178660261631009,
      "step": 100
    },
    {
      "MSE": 864.7878089396156,
      "MSE/layer0": 864.7878089396156,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.02,
      "input_norm": 31.995868380864444,
      "input_norm/layer0": 31.995868380864444,
      "learning_rate": 0.00015,
      "loss": 3.596,
      "max_norm": 34.7879753112793,
      "max_norm/layer0": 34.7879753112793,
      "mean_norm": 32.057809829711914,
      "mean_norm/layer0": 32.057809829711914,
      "multicode_k": 1,
      "output_norm": 4.227458424568177,
      "output_norm/layer0": 4.227458424568177,
      "step": 150
    },
    {
      "MSE": 862.2720657348631,
      "MSE/layer0": 862.2720657348631,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.02,
      "input_norm": 31.996261011759444,
      "input_norm/layer0": 31.996261011759444,
      "learning_rate": 0.0002,
      "loss": 3.3864,
      "max_norm": 34.834476470947266,
      "max_norm/layer0": 34.834476470947266,
      "mean_norm": 32.09993934631348,
      "mean_norm/layer0": 32.09993934631348,
      "multicode_k": 1,
      "output_norm": 4.271083230972291,
      "output_norm/layer0": 4.271083230972291,
      "step": 200
    },
    {
      "MSE": 860.8860168457031,
      "MSE/layer0": 860.8860168457031,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.03,
      "input_norm": 31.99663330396016,
      "input_norm/layer0": 31.99663330396016,
      "learning_rate": 0.00025,
      "loss": 3.1841,
      "max_norm": 34.880577087402344,
      "max_norm/layer0": 34.880577087402344,
      "mean_norm": 32.15042304992676,
      "mean_norm/layer0": 32.15042304992676,
      "multicode_k": 1,
      "output_norm": 4.302526236375174,
      "output_norm/layer0": 4.302526236375174,
      "step": 250
    },
    {
      "MSE": 859.4145241292313,
      "MSE/layer0": 859.4145241292313,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.03,
      "input_norm": 31.99707999547323,
      "input_norm/layer0": 31.99707999547323,
      "learning_rate": 0.0003,
      "loss": 2.9941,
      "max_norm": 34.94011688232422,
      "max_norm/layer0": 34.94011688232422,
      "mean_norm": 32.21405220031738,
      "mean_norm/layer0": 32.21405220031738,
      "multicode_k": 1,
      "output_norm": 4.340623443921407,
      "output_norm/layer0": 4.340623443921407,
      "step": 300
    },
    {
      "MSE": 857.4514228312173,
      "MSE/layer0": 857.4514228312173,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.04,
      "input_norm": 31.997263495127353,
      "input_norm/layer0": 31.997263495127353,
      "learning_rate": 0.00035,
      "loss": 2.8154,
      "max_norm": 35.02033996582031,
      "max_norm/layer0": 35.02033996582031,
      "mean_norm": 32.2895393371582,
      "mean_norm/layer0": 32.2895393371582,
      "multicode_k": 1,
      "output_norm": 4.388785634040833,
      "output_norm/layer0": 4.388785634040833,
      "step": 350
    },
    {
      "MSE": 855.6023776245115,
      "MSE/layer0": 855.6023776245115,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.04,
      "input_norm": 31.997391548156735,
      "input_norm/layer0": 31.997391548156735,
      "learning_rate": 0.0004,
      "loss": 2.6472,
      "max_norm": 35.093902587890625,
      "max_norm/layer0": 35.093902587890625,
      "mean_norm": 32.36477088928223,
      "mean_norm/layer0": 32.36477088928223,
      "multicode_k": 1,
      "output_norm": 4.438224600950877,
      "output_norm/layer0": 4.438224600950877,
      "step": 400
    },
    {
      "MSE": 852.2393107096357,
      "MSE/layer0": 852.2393107096357,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.05,
      "input_norm": 31.997483587265002,
      "input_norm/layer0": 31.997483587265002,
      "learning_rate": 0.00045000000000000004,
      "loss": 2.5584,
      "max_norm": 35.304176330566406,
      "max_norm/layer0": 35.304176330566406,
      "mean_norm": 32.54551696777344,
      "mean_norm/layer0": 32.54551696777344,
      "multicode_k": 1,
      "output_norm": 4.531697844664256,
      "output_norm/layer0": 4.531697844664256,
      "step": 450
    },
    {
      "MSE": 845.160081481933,
      "MSE/layer0": 845.160081481933,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.05,
      "input_norm": 31.997576513290404,
      "input_norm/layer0": 31.997576513290404,
      "learning_rate": 0.0005,
      "loss": 2.5072,
      "max_norm": 35.78097915649414,
      "max_norm/layer0": 35.78097915649414,
      "mean_norm": 32.836992263793945,
      "mean_norm/layer0": 32.836992263793945,
      "multicode_k": 1,
      "output_norm": 4.75731077671051,
      "output_norm/layer0": 4.75731077671051,
      "step": 500
    },
    {
      "epoch": 0.05,
      "eval_MSE/layer0": 841.1602262364518,
      "eval_accuracy": 0.4578774282778804,
      "eval_dead_code_fraction/layer0": 0.0,
      "eval_input_norm/layer0": 31.99765928777141,
      "eval_loss": 2.476405382156372,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 4.911408371361153,
      "eval_runtime": 73.5499,
      "eval_samples_per_second": 62.855,
      "eval_steps_per_second": 7.859,
      "step": 500
    },
    {
      "MSE": 837.1320628865564,
      "MSE/layer0": 837.1320628865564,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.06,
      "input_norm": 31.997703491846714,
      "input_norm/layer0": 31.997703491846714,
      "learning_rate": 0.0004973684210526315,
      "loss": 2.446,
      "max_norm": 36.301849365234375,
      "max_norm/layer0": 36.301849365234375,
      "mean_norm": 33.16576957702637,
      "mean_norm/layer0": 33.16576957702637,
      "multicode_k": 1,
      "output_norm": 5.083427506287892,
      "output_norm/layer0": 5.083427506287892,
      "step": 550
    },
    {
      "MSE": 829.8174697875975,
      "MSE/layer0": 829.8174697875975,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.06,
      "input_norm": 31.997781289418548,
      "input_norm/layer0": 31.997781289418548,
      "learning_rate": 0.0004947368421052632,
      "loss": 2.4026,
      "max_norm": 36.790077209472656,
      "max_norm/layer0": 36.790077209472656,
      "mean_norm": 33.519426345825195,
      "mean_norm/layer0": 33.519426345825195,
      "multicode_k": 1,
      "output_norm": 5.438902084827422,
      "output_norm/layer0": 5.438902084827422,
      "step": 600
    },
    {
      "MSE": 823.647299601237,
      "MSE/layer0": 823.647299601237,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.07,
      "input_norm": 31.997854344050104,
      "input_norm/layer0": 31.997854344050104,
      "learning_rate": 0.0004921052631578947,
      "loss": 2.3506,
      "max_norm": 37.23988723754883,
      "max_norm/layer0": 37.23988723754883,
      "mean_norm": 33.882219314575195,
      "mean_norm/layer0": 33.882219314575195,
      "multicode_k": 1,
      "output_norm": 5.780141766071318,
      "output_norm/layer0": 5.780141766071318,
      "step": 650
    },
    {
      "MSE": 818.3900874837236,
      "MSE/layer0": 818.3900874837236,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.07,
      "input_norm": 31.99789853731792,
      "input_norm/layer0": 31.99789853731792,
      "learning_rate": 0.0004894736842105264,
      "loss": 2.3252,
      "max_norm": 37.74921417236328,
      "max_norm/layer0": 37.74921417236328,
      "mean_norm": 34.241193771362305,
      "mean_norm/layer0": 34.241193771362305,
      "multicode_k": 1,
      "output_norm": 6.09345253547033,
      "output_norm/layer0": 6.09345253547033,
      "step": 700
    },
    {
      "MSE": 813.5141651407878,
      "MSE/layer0": 813.5141651407878,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.08,
      "input_norm": 31.99791718482971,
      "input_norm/layer0": 31.99791718482971,
      "learning_rate": 0.0004868421052631579,
      "loss": 2.2972,
      "max_norm": 38.29411315917969,
      "max_norm/layer0": 38.29411315917969,
      "mean_norm": 34.602651596069336,
      "mean_norm/layer0": 34.602651596069336,
      "multicode_k": 1,
      "output_norm": 6.373116828600564,
      "output_norm/layer0": 6.373116828600564,
      "step": 750
    },
    {
      "MSE": 808.9583784993486,
      "MSE/layer0": 808.9583784993486,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.08,
      "input_norm": 31.997929916381842,
      "input_norm/layer0": 31.997929916381842,
      "learning_rate": 0.0004842105263157895,
      "loss": 2.2848,
      "max_norm": 38.83885955810547,
      "max_norm/layer0": 38.83885955810547,
      "mean_norm": 34.96581268310547,
      "mean_norm/layer0": 34.96581268310547,
      "multicode_k": 1,
      "output_norm": 6.6348445963859515,
      "output_norm/layer0": 6.6348445963859515,
      "step": 800
    },
    {
      "MSE": 805.0894353230792,
      "MSE/layer0": 805.0894353230792,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.09,
      "input_norm": 31.99793632825216,
      "input_norm/layer0": 31.99793632825216,
      "learning_rate": 0.00048157894736842105,
      "loss": 2.2718,
      "max_norm": 39.34720993041992,
      "max_norm/layer0": 39.34720993041992,
      "mean_norm": 35.32806396484375,
      "mean_norm/layer0": 35.32806396484375,
      "multicode_k": 1,
      "output_norm": 6.866891795794173,
      "output_norm/layer0": 6.866891795794173,
      "step": 850
    },
    {
      "MSE": 801.1131992594401,
      "MSE/layer0": 801.1131992594401,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.09,
      "input_norm": 31.997941767374677,
      "input_norm/layer0": 31.997941767374677,
      "learning_rate": 0.00047894736842105264,
      "loss": 2.2552,
      "max_norm": 39.885169982910156,
      "max_norm/layer0": 39.885169982910156,
      "mean_norm": 35.689327239990234,
      "mean_norm/layer0": 35.689327239990234,
      "multicode_k": 1,
      "output_norm": 7.08060004631678,
      "output_norm/layer0": 7.08060004631678,
      "step": 900
    },
    {
      "MSE": 797.5655348714191,
      "MSE/layer0": 797.5655348714191,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.1,
      "input_norm": 31.997945496241247,
      "input_norm/layer0": 31.997945496241247,
      "learning_rate": 0.0004763157894736842,
      "loss": 2.2364,
      "max_norm": 40.398529052734375,
      "max_norm/layer0": 40.398529052734375,
      "mean_norm": 36.051015853881836,
      "mean_norm/layer0": 36.051015853881836,
      "multicode_k": 1,
      "output_norm": 7.280441036224362,
      "output_norm/layer0": 7.280441036224362,
      "step": 950
    },
    {
      "MSE": 794.0057167561844,
      "MSE/layer0": 794.0057167561844,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.1,
      "input_norm": 31.997958205540975,
      "input_norm/layer0": 31.997958205540975,
      "learning_rate": 0.00047368421052631577,
      "loss": 2.2285,
      "max_norm": 40.882999420166016,
      "max_norm/layer0": 40.882999420166016,
      "mean_norm": 36.412479400634766,
      "mean_norm/layer0": 36.412479400634766,
      "multicode_k": 1,
      "output_norm": 7.463625483512881,
      "output_norm/layer0": 7.463625483512881,
      "step": 1000
    },
    {
      "epoch": 0.1,
      "eval_MSE/layer0": 792.3022871601257,
      "eval_accuracy": 0.49262569806414397,
      "eval_dead_code_fraction/layer0": 0.0,
      "eval_input_norm/layer0": 31.997970815399036,
      "eval_loss": 2.2265193462371826,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 7.55243569582849,
      "eval_runtime": 73.9102,
      "eval_samples_per_second": 62.549,
      "eval_steps_per_second": 7.82,
      "step": 1000
    },
    {
      "MSE": 790.4031213378905,
      "MSE/layer0": 790.4031213378905,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.11,
      "input_norm": 31.997961893081662,
      "input_norm/layer0": 31.997961893081662,
      "learning_rate": 0.0004710526315789474,
      "loss": 2.2276,
      "max_norm": 41.373714447021484,
      "max_norm/layer0": 41.373714447021484,
      "mean_norm": 36.77394676208496,
      "mean_norm/layer0": 36.77394676208496,
      "multicode_k": 1,
      "output_norm": 7.636834317048386,
      "output_norm/layer0": 7.636834317048386,
      "step": 1050
    },
    {
      "MSE": 786.9933625284832,
      "MSE/layer0": 786.9933625284832,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.11,
      "input_norm": 31.99796496391297,
      "input_norm/layer0": 31.99796496391297,
      "learning_rate": 0.00046842105263157895,
      "loss": 2.2167,
      "max_norm": 41.845481872558594,
      "max_norm/layer0": 41.845481872558594,
      "mean_norm": 37.13482093811035,
      "mean_norm/layer0": 37.13482093811035,
      "multicode_k": 1,
      "output_norm": 7.803330462773646,
      "output_norm/layer0": 7.803330462773646,
      "step": 1100
    },
    {
      "MSE": 783.8570914713541,
      "MSE/layer0": 783.8570914713541,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.12,
      "input_norm": 31.997962007522577,
      "input_norm/layer0": 31.997962007522577,
      "learning_rate": 0.00046578947368421054,
      "loss": 2.2049,
      "max_norm": 42.328094482421875,
      "max_norm/layer0": 42.328094482421875,
      "mean_norm": 37.49737358093262,
      "mean_norm/layer0": 37.49737358093262,
      "multicode_k": 1,
      "output_norm": 7.957673575878145,
      "output_norm/layer0": 7.957673575878145,
      "step": 1150
    },
    {
      "MSE": 780.325506286621,
      "MSE/layer0": 780.325506286621,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.13,
      "input_norm": 31.997955818176273,
      "input_norm/layer0": 31.997955818176273,
      "learning_rate": 0.00046315789473684214,
      "loss": 2.2048,
      "max_norm": 42.827125549316406,
      "max_norm/layer0": 42.827125549316406,
      "mean_norm": 37.85981369018555,
      "mean_norm/layer0": 37.85981369018555,
      "multicode_k": 1,
      "output_norm": 8.110501464207967,
      "output_norm/layer0": 8.110501464207967,
      "step": 1200
    },
    {
      "MSE": 777.4963677978517,
      "MSE/layer0": 777.4963677978517,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.13,
      "input_norm": 31.997957773208608,
      "input_norm/layer0": 31.997957773208608,
      "learning_rate": 0.0004605263157894737,
      "loss": 2.1813,
      "max_norm": 43.32162094116211,
      "max_norm/layer0": 43.32162094116211,
      "mean_norm": 38.223052978515625,
      "mean_norm/layer0": 38.223052978515625,
      "multicode_k": 1,
      "output_norm": 8.244436805248263,
      "output_norm/layer0": 8.244436805248263,
      "step": 1250
    },
    {
      "MSE": 774.260437520345,
      "MSE/layer0": 774.260437520345,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.14,
      "input_norm": 31.99796381632487,
      "input_norm/layer0": 31.99796381632487,
      "learning_rate": 0.00045789473684210527,
      "loss": 2.1836,
      "max_norm": 43.81217575073242,
      "max_norm/layer0": 43.81217575073242,
      "mean_norm": 38.58406066894531,
      "mean_norm/layer0": 38.58406066894531,
      "multicode_k": 1,
      "output_norm": 8.38570425987244,
      "output_norm/layer0": 8.38570425987244,
      "step": 1300
    },
    {
      "MSE": 771.4710861206056,
      "MSE/layer0": 771.4710861206056,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.14,
      "input_norm": 31.997958866755184,
      "input_norm/layer0": 31.997958866755184,
      "learning_rate": 0.00045526315789473686,
      "loss": 2.1749,
      "max_norm": 44.29291915893555,
      "max_norm/layer0": 44.29291915893555,
      "mean_norm": 38.94841957092285,
      "mean_norm/layer0": 38.94841957092285,
      "multicode_k": 1,
      "output_norm": 8.50825534900029,
      "output_norm/layer0": 8.50825534900029,
      "step": 1350
    },
    {
      "MSE": 768.6556185913084,
      "MSE/layer0": 768.6556185913084,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.15,
      "input_norm": 31.99795674959818,
      "input_norm/layer0": 31.99795674959818,
      "learning_rate": 0.00045263157894736845,
      "loss": 2.1767,
      "max_norm": 44.80799865722656,
      "max_norm/layer0": 44.80799865722656,
      "mean_norm": 39.31004524230957,
      "mean_norm/layer0": 39.31004524230957,
      "multicode_k": 1,
      "output_norm": 8.633222222328184,
      "output_norm/layer0": 8.633222222328184,
      "step": 1400
    },
    {
      "MSE": 765.9088921101885,
      "MSE/layer0": 765.9088921101885,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.15,
      "input_norm": 31.99795736630759,
      "input_norm/layer0": 31.99795736630759,
      "learning_rate": 0.00045000000000000004,
      "loss": 2.1614,
      "max_norm": 45.24712371826172,
      "max_norm/layer0": 45.24712371826172,
      "mean_norm": 39.66674041748047,
      "mean_norm/layer0": 39.66674041748047,
      "multicode_k": 1,
      "output_norm": 8.743508942921961,
      "output_norm/layer0": 8.743508942921961,
      "step": 1450
    },
    {
      "MSE": 763.2800780232742,
      "MSE/layer0": 763.2800780232742,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.16,
      "input_norm": 31.997952944437664,
      "input_norm/layer0": 31.997952944437664,
      "learning_rate": 0.0004473684210526316,
      "loss": 2.1472,
      "max_norm": 45.6886100769043,
      "max_norm/layer0": 45.6886100769043,
      "mean_norm": 40.02728462219238,
      "mean_norm/layer0": 40.02728462219238,
      "multicode_k": 1,
      "output_norm": 8.859908480644224,
      "output_norm/layer0": 8.859908480644224,
      "step": 1500
    },
    {
      "epoch": 0.16,
      "eval_MSE/layer0": 761.8682555426203,
      "eval_accuracy": 0.502513147213907,
      "eval_dead_code_fraction/layer0": 0.0,
      "eval_input_norm/layer0": 31.99796608230291,
      "eval_loss": 2.1583588123321533,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 8.92388377993132,
      "eval_runtime": 73.3386,
      "eval_samples_per_second": 63.036,
      "eval_steps_per_second": 7.881,
      "step": 1500
    },
    {
      "MSE": 760.1600253295896,
      "MSE/layer0": 760.1600253295896,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.16,
      "input_norm": 31.997961203257255,
      "input_norm/layer0": 31.997961203257255,
      "learning_rate": 0.00044473684210526317,
      "loss": 2.1601,
      "max_norm": 46.172386169433594,
      "max_norm/layer0": 46.172386169433594,
      "mean_norm": 40.38890838623047,
      "mean_norm/layer0": 40.38890838623047,
      "multicode_k": 1,
      "output_norm": 8.976485926310215,
      "output_norm/layer0": 8.976485926310215,
      "step": 1550
    },
    {
      "MSE": 757.7968755086266,
      "MSE/layer0": 757.7968755086266,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.17,
      "input_norm": 31.99795768419901,
      "input_norm/layer0": 31.99795768419901,
      "learning_rate": 0.0004421052631578947,
      "loss": 2.1503,
      "max_norm": 46.59892272949219,
      "max_norm/layer0": 46.59892272949219,
      "mean_norm": 40.74970626831055,
      "mean_norm/layer0": 40.74970626831055,
      "multicode_k": 1,
      "output_norm": 9.079196619192757,
      "output_norm/layer0": 9.079196619192757,
      "step": 1600
    },
    {
      "MSE": 755.1489293416341,
      "MSE/layer0": 755.1489293416341,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.17,
      "input_norm": 31.997956597010287,
      "input_norm/layer0": 31.997956597010287,
      "learning_rate": 0.0004394736842105263,
      "loss": 2.1474,
      "max_norm": 47.01366424560547,
      "max_norm/layer0": 47.01366424560547,
      "mean_norm": 41.107492446899414,
      "mean_norm/layer0": 41.107492446899414,
      "multicode_k": 1,
      "output_norm": 9.18502354939779,
      "output_norm/layer0": 9.18502354939779,
      "step": 1650
    },
    {
      "MSE": 752.7132907104492,
      "MSE/layer0": 752.7132907104492,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.18,
      "input_norm": 31.997961333592727,
      "input_norm/layer0": 31.997961333592727,
      "learning_rate": 0.00043684210526315795,
      "loss": 2.1451,
      "max_norm": 47.46398162841797,
      "max_norm/layer0": 47.46398162841797,
      "mean_norm": 41.466739654541016,
      "mean_norm/layer0": 41.466739654541016,
      "multicode_k": 1,
      "output_norm": 9.288365476131446,
      "output_norm/layer0": 9.288365476131446,
      "step": 1700
    },
    {
      "MSE": 750.1894300333656,
      "MSE/layer0": 750.1894300333656,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.18,
      "input_norm": 31.99795596122742,
      "input_norm/layer0": 31.99795596122742,
      "learning_rate": 0.0004342105263157895,
      "loss": 2.1298,
      "max_norm": 47.89784240722656,
      "max_norm/layer0": 47.89784240722656,
      "mean_norm": 41.825233459472656,
      "mean_norm/layer0": 41.825233459472656,
      "multicode_k": 1,
      "output_norm": 9.383608838717148,
      "output_norm/layer0": 9.383608838717148,
      "step": 1750
    },
    {
      "MSE": 747.6542997233073,
      "MSE/layer0": 747.6542997233073,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.19,
      "input_norm": 31.997955916722606,
      "input_norm/layer0": 31.997955916722606,
      "learning_rate": 0.0004315789473684211,
      "loss": 2.1238,
      "max_norm": 48.32524871826172,
      "max_norm/layer0": 48.32524871826172,
      "mean_norm": 42.18182373046875,
      "mean_norm/layer0": 42.18182373046875,
      "multicode_k": 1,
      "output_norm": 9.481378455162048,
      "output_norm/layer0": 9.481378455162048,
      "step": 1800
    },
    {
      "MSE": 745.4623332722983,
      "MSE/layer0": 745.4623332722983,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.19,
      "input_norm": 31.99795308430989,
      "input_norm/layer0": 31.99795308430989,
      "learning_rate": 0.0004289473684210526,
      "loss": 2.1193,
      "max_norm": 48.75049591064453,
      "max_norm/layer0": 48.75049591064453,
      "mean_norm": 42.53817176818848,
      "mean_norm/layer0": 42.53817176818848,
      "multicode_k": 1,
      "output_norm": 9.570223178863522,
      "output_norm/layer0": 9.570223178863522,
      "step": 1850
    },
    {
      "MSE": 743.2356170654296,
      "MSE/layer0": 743.2356170654296,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.2,
      "input_norm": 31.997956037521366,
      "input_norm/layer0": 31.997956037521366,
      "learning_rate": 0.0004263157894736842,
      "loss": 2.114,
      "max_norm": 49.169532775878906,
      "max_norm/layer0": 49.169532775878906,
      "mean_norm": 42.89301300048828,
      "mean_norm/layer0": 42.89301300048828,
      "multicode_k": 1,
      "output_norm": 9.656177865664167,
      "output_norm/layer0": 9.656177865664167,
      "step": 1900
    },
    {
      "MSE": 740.6696187337238,
      "MSE/layer0": 740.6696187337238,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.2,
      "input_norm": 31.997947629292796,
      "input_norm/layer0": 31.997947629292796,
      "learning_rate": 0.0004236842105263158,
      "loss": 2.1208,
      "max_norm": 49.5915641784668,
      "max_norm/layer0": 49.5915641784668,
      "mean_norm": 43.247257232666016,
      "mean_norm/layer0": 43.247257232666016,
      "multicode_k": 1,
      "output_norm": 9.750187404950456,
      "output_norm/layer0": 9.750187404950456,
      "step": 1950
    },
    {
      "MSE": 738.2711766560866,
      "MSE/layer0": 738.2711766560866,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.21,
      "input_norm": 31.99795049031576,
      "input_norm/layer0": 31.99795049031576,
      "learning_rate": 0.00042105263157894734,
      "loss": 2.1144,
      "max_norm": 50.01121520996094,
      "max_norm/layer0": 50.01121520996094,
      "mean_norm": 43.60071563720703,
      "mean_norm/layer0": 43.60071563720703,
      "multicode_k": 1,
      "output_norm": 9.839046444892887,
      "output_norm/layer0": 9.839046444892887,
      "step": 2000
    },
    {
      "epoch": 0.21,
      "eval_MSE/layer0": 737.1842960305685,
      "eval_accuracy": 0.5089533842961654,
      "eval_dead_code_fraction/layer0": 0.0,
      "eval_input_norm/layer0": 31.997949216728358,
      "eval_loss": 2.112781524658203,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 9.899169789850005,
      "eval_runtime": 73.2721,
      "eval_samples_per_second": 63.094,
      "eval_steps_per_second": 7.888,
      "step": 2000
    },
    {
      "MSE": 736.3252647908528,
      "MSE/layer0": 736.3252647908528,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.21,
      "input_norm": 31.997952928543082,
      "input_norm/layer0": 31.997952928543082,
      "learning_rate": 0.000418421052631579,
      "loss": 2.1054,
      "max_norm": 50.480525970458984,
      "max_norm/layer0": 50.480525970458984,
      "mean_norm": 43.9530086517334,
      "mean_norm/layer0": 43.9530086517334,
      "multicode_k": 1,
      "output_norm": 9.923008087476088,
      "output_norm/layer0": 9.923008087476088,
      "step": 2050
    },
    {
      "MSE": 734.2413449096682,
      "MSE/layer0": 734.2413449096682,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.22,
      "input_norm": 31.99795233090719,
      "input_norm/layer0": 31.99795233090719,
      "learning_rate": 0.0004157894736842106,
      "loss": 2.114,
      "max_norm": 50.909828186035156,
      "max_norm/layer0": 50.909828186035156,
      "mean_norm": 44.302608489990234,
      "mean_norm/layer0": 44.302608489990234,
      "multicode_k": 1,
      "output_norm": 9.99465080579122,
      "output_norm/layer0": 9.99465080579122,
      "step": 2100
    },
    {
      "MSE": 732.1211085001627,
      "MSE/layer0": 732.1211085001627,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.22,
      "input_norm": 31.997947177886957,
      "input_norm/layer0": 31.997947177886957,
      "learning_rate": 0.0004131578947368421,
      "loss": 2.1053,
      "max_norm": 51.30076217651367,
      "max_norm/layer0": 51.30076217651367,
      "mean_norm": 44.650190353393555,
      "mean_norm/layer0": 44.650190353393555,
      "multicode_k": 1,
      "output_norm": 10.083865798314415,
      "output_norm/layer0": 10.083865798314415,
      "step": 2150
    },
    {
      "MSE": 729.7699541219072,
      "MSE/layer0": 729.7699541219072,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.23,
      "input_norm": 31.997944199244184,
      "input_norm/layer0": 31.997944199244184,
      "learning_rate": 0.0004105263157894737,
      "loss": 2.092,
      "max_norm": 51.70292282104492,
      "max_norm/layer0": 51.70292282104492,
      "mean_norm": 44.99736022949219,
      "mean_norm/layer0": 44.99736022949219,
      "multicode_k": 1,
      "output_norm": 10.171215546925865,
      "output_norm/layer0": 10.171215546925865,
      "step": 2200
    },
    {
      "MSE": 727.7426215616864,
      "MSE/layer0": 727.7426215616864,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.23,
      "input_norm": 31.997949040730795,
      "input_norm/layer0": 31.997949040730795,
      "learning_rate": 0.00040789473684210524,
      "loss": 2.0989,
      "max_norm": 52.09043502807617,
      "max_norm/layer0": 52.09043502807617,
      "mean_norm": 45.34288787841797,
      "mean_norm/layer0": 45.34288787841797,
      "multicode_k": 1,
      "output_norm": 10.245072917938227,
      "output_norm/layer0": 10.245072917938227,
      "step": 2250
    },
    {
      "MSE": 725.7510225423177,
      "MSE/layer0": 725.7510225423177,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.24,
      "input_norm": 31.997945086161295,
      "input_norm/layer0": 31.997945086161295,
      "learning_rate": 0.00040526315789473684,
      "loss": 2.0921,
      "max_norm": 52.48381423950195,
      "max_norm/layer0": 52.48381423950195,
      "mean_norm": 45.685386657714844,
      "mean_norm/layer0": 45.685386657714844,
      "multicode_k": 1,
      "output_norm": 10.316563812891642,
      "output_norm/layer0": 10.316563812891642,
      "step": 2300
    },
    {
      "MSE": 723.730980834961,
      "MSE/layer0": 723.730980834961,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.25,
      "input_norm": 31.997938013076794,
      "input_norm/layer0": 31.997938013076794,
      "learning_rate": 0.00040263157894736843,
      "loss": 2.0863,
      "max_norm": 52.871910095214844,
      "max_norm/layer0": 52.871910095214844,
      "mean_norm": 46.027950286865234,
      "mean_norm/layer0": 46.027950286865234,
      "multicode_k": 1,
      "output_norm": 10.396288099288938,
      "output_norm/layer0": 10.396288099288938,
      "step": 2350
    },
    {
      "MSE": 721.850106608073,
      "MSE/layer0": 721.850106608073,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.25,
      "input_norm": 31.99794317245484,
      "input_norm/layer0": 31.99794317245484,
      "learning_rate": 0.0004,
      "loss": 2.0883,
      "max_norm": 53.25300598144531,
      "max_norm/layer0": 53.25300598144531,
      "mean_norm": 46.366220474243164,
      "mean_norm/layer0": 46.366220474243164,
      "multicode_k": 1,
      "output_norm": 10.462737544377642,
      "output_norm/layer0": 10.462737544377642,
      "step": 2400
    },
    {
      "MSE": 720.002911987305,
      "MSE/layer0": 720.002911987305,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.26,
      "input_norm": 31.997945442199722,
      "input_norm/layer0": 31.997945442199722,
      "learning_rate": 0.0003973684210526316,
      "loss": 2.0813,
      "max_norm": 53.6557502746582,
      "max_norm/layer0": 53.6557502746582,
      "mean_norm": 46.70218849182129,
      "mean_norm/layer0": 46.70218849182129,
      "multicode_k": 1,
      "output_norm": 10.54251501719157,
      "output_norm/layer0": 10.54251501719157,
      "step": 2450
    },
    {
      "MSE": 717.8726328531905,
      "MSE/layer0": 717.8726328531905,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.26,
      "input_norm": 31.997946141560867,
      "input_norm/layer0": 31.997946141560867,
      "learning_rate": 0.00039473684210526315,
      "loss": 2.0847,
      "max_norm": 54.013648986816406,
      "max_norm/layer0": 54.013648986816406,
      "mean_norm": 47.03492546081543,
      "mean_norm/layer0": 47.03492546081543,
      "multicode_k": 1,
      "output_norm": 10.61746094703674,
      "output_norm/layer0": 10.61746094703674,
      "step": 2500
    },
    {
      "epoch": 0.26,
      "eval_MSE/layer0": 716.9390104187793,
      "eval_accuracy": 0.5142129041984603,
      "eval_dead_code_fraction/layer0": 0.0,
      "eval_input_norm/layer0": 31.997947305666536,
      "eval_loss": 2.0790653228759766,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 10.657726783760687,
      "eval_runtime": 73.6422,
      "eval_samples_per_second": 62.776,
      "eval_steps_per_second": 7.849,
      "step": 2500
    },
    {
      "MSE": 715.8716929117836,
      "MSE/layer0": 715.8716929117836,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.27,
      "input_norm": 31.99793814023335,
      "input_norm/layer0": 31.99793814023335,
      "learning_rate": 0.00039210526315789474,
      "loss": 2.0789,
      "max_norm": 54.395057678222656,
      "max_norm/layer0": 54.395057678222656,
      "mean_norm": 47.36547088623047,
      "mean_norm/layer0": 47.36547088623047,
      "multicode_k": 1,
      "output_norm": 10.687965892155965,
      "output_norm/layer0": 10.687965892155965,
      "step": 2550
    },
    {
      "MSE": 713.9484742228188,
      "MSE/layer0": 713.9484742228188,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.27,
      "input_norm": 31.997940645217888,
      "input_norm/layer0": 31.997940645217888,
      "learning_rate": 0.00038947368421052633,
      "loss": 2.0747,
      "max_norm": 54.81391525268555,
      "max_norm/layer0": 54.81391525268555,
      "mean_norm": 47.6934928894043,
      "mean_norm/layer0": 47.6934928894043,
      "multicode_k": 1,
      "output_norm": 10.762619382540386,
      "output_norm/layer0": 10.762619382540386,
      "step": 2600
    },
    {
      "MSE": 711.9854763793942,
      "MSE/layer0": 711.9854763793942,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.28,
      "input_norm": 31.997925097147615,
      "input_norm/layer0": 31.997925097147615,
      "learning_rate": 0.00038684210526315787,
      "loss": 2.0679,
      "max_norm": 55.21110916137695,
      "max_norm/layer0": 55.21110916137695,
      "mean_norm": 48.01936340332031,
      "mean_norm/layer0": 48.01936340332031,
      "multicode_k": 1,
      "output_norm": 10.838534935315447,
      "output_norm/layer0": 10.838534935315447,
      "step": 2650
    },
    {
      "MSE": 710.4415082804362,
      "MSE/layer0": 710.4415082804362,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.28,
      "input_norm": 31.997930930455517,
      "input_norm/layer0": 31.997930930455517,
      "learning_rate": 0.00038421052631578946,
      "loss": 2.0619,
      "max_norm": 55.63144302368164,
      "max_norm/layer0": 55.63144302368164,
      "mean_norm": 48.34212875366211,
      "mean_norm/layer0": 48.34212875366211,
      "multicode_k": 1,
      "output_norm": 10.893479135831196,
      "output_norm/layer0": 10.893479135831196,
      "step": 2700
    },
    {
      "MSE": 708.5378164672845,
      "MSE/layer0": 708.5378164672845,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.29,
      "input_norm": 31.99792820294698,
      "input_norm/layer0": 31.99792820294698,
      "learning_rate": 0.00038157894736842105,
      "loss": 2.0461,
      "max_norm": 56.01336669921875,
      "max_norm/layer0": 56.01336669921875,
      "mean_norm": 48.66323280334473,
      "mean_norm/layer0": 48.66323280334473,
      "multicode_k": 1,
      "output_norm": 10.971131575902309,
      "output_norm/layer0": 10.971131575902309,
      "step": 2750
    },
    {
      "MSE": 706.6155220540361,
      "MSE/layer0": 706.6155220540361,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.29,
      "input_norm": 31.997930272420245,
      "input_norm/layer0": 31.997930272420245,
      "learning_rate": 0.00037894736842105265,
      "loss": 2.0594,
      "max_norm": 56.40309143066406,
      "max_norm/layer0": 56.40309143066406,
      "mean_norm": 48.980411529541016,
      "mean_norm/layer0": 48.980411529541016,
      "multicode_k": 1,
      "output_norm": 11.042961815198257,
      "output_norm/layer0": 11.042961815198257,
      "step": 2800
    },
    {
      "MSE": 704.6534555053711,
      "MSE/layer0": 704.6534555053711,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.3,
      "input_norm": 31.99792085011799,
      "input_norm/layer0": 31.99792085011799,
      "learning_rate": 0.00037631578947368424,
      "loss": 2.0499,
      "max_norm": 56.79050064086914,
      "max_norm/layer0": 56.79050064086914,
      "mean_norm": 49.293588638305664,
      "mean_norm/layer0": 49.293588638305664,
      "multicode_k": 1,
      "output_norm": 11.11463791847229,
      "output_norm/layer0": 11.11463791847229,
      "step": 2850
    },
    {
      "MSE": 702.691480916341,
      "MSE/layer0": 702.691480916341,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.3,
      "input_norm": 31.997921177546203,
      "input_norm/layer0": 31.997921177546203,
      "learning_rate": 0.0003736842105263158,
      "loss": 2.0472,
      "max_norm": 57.16228103637695,
      "max_norm/layer0": 57.16228103637695,
      "mean_norm": 49.60378646850586,
      "mean_norm/layer0": 49.60378646850586,
      "multicode_k": 1,
      "output_norm": 11.188902417818706,
      "output_norm/layer0": 11.188902417818706,
      "step": 2900
    },
    {
      "MSE": 700.9804660034181,
      "MSE/layer0": 700.9804660034181,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.31,
      "input_norm": 31.997924566268914,
      "input_norm/layer0": 31.997924566268914,
      "learning_rate": 0.00037105263157894737,
      "loss": 2.0557,
      "max_norm": 57.52459716796875,
      "max_norm/layer0": 57.52459716796875,
      "mean_norm": 49.91103553771973,
      "mean_norm/layer0": 49.91103553771973,
      "multicode_k": 1,
      "output_norm": 11.253552745183304,
      "output_norm/layer0": 11.253552745183304,
      "step": 2950
    },
    {
      "MSE": 699.5130490112299,
      "MSE/layer0": 699.5130490112299,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.31,
      "input_norm": 31.997922519048053,
      "input_norm/layer0": 31.997922519048053,
      "learning_rate": 0.00036842105263157896,
      "loss": 2.0439,
      "max_norm": 57.87739562988281,
      "max_norm/layer0": 57.87739562988281,
      "mean_norm": 50.21486854553223,
      "mean_norm/layer0": 50.21486854553223,
      "multicode_k": 1,
      "output_norm": 11.316310184796652,
      "output_norm/layer0": 11.316310184796652,
      "step": 3000
    },
    {
      "epoch": 0.31,
      "eval_MSE/layer0": 698.7265792011616,
      "eval_accuracy": 0.5184875063671823,
      "eval_dead_code_fraction/layer0": 0.0,
      "eval_input_norm/layer0": 31.997919895214224,
      "eval_loss": 2.0482470989227295,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 11.359921689315088,
      "eval_runtime": 74.2109,
      "eval_samples_per_second": 62.295,
      "eval_steps_per_second": 7.789,
      "step": 3000
    },
    {
      "MSE": 697.8663801066077,
      "MSE/layer0": 697.8663801066077,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.32,
      "input_norm": 31.997911771138504,
      "input_norm/layer0": 31.997911771138504,
      "learning_rate": 0.00036578947368421055,
      "loss": 2.0511,
      "max_norm": 58.24200439453125,
      "max_norm/layer0": 58.24200439453125,
      "mean_norm": 50.51446723937988,
      "mean_norm/layer0": 50.51446723937988,
      "multicode_k": 1,
      "output_norm": 11.388139980634046,
      "output_norm/layer0": 11.388139980634046,
      "step": 3050
    },
    {
      "MSE": 696.0450835164395,
      "MSE/layer0": 696.0450835164395,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.32,
      "input_norm": 31.9979209582011,
      "input_norm/layer0": 31.9979209582011,
      "learning_rate": 0.00036315789473684214,
      "loss": 2.0466,
      "max_norm": 58.58406066894531,
      "max_norm/layer0": 58.58406066894531,
      "mean_norm": 50.81120681762695,
      "mean_norm/layer0": 50.81120681762695,
      "multicode_k": 1,
      "output_norm": 11.455551563898727,
      "output_norm/layer0": 11.455551563898727,
      "step": 3100
    },
    {
      "MSE": 694.5301999918622,
      "MSE/layer0": 694.5301999918622,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.33,
      "input_norm": 31.99790574709574,
      "input_norm/layer0": 31.99790574709574,
      "learning_rate": 0.0003605263157894737,
      "loss": 2.0294,
      "max_norm": 58.931087493896484,
      "max_norm/layer0": 58.931087493896484,
      "mean_norm": 51.104164123535156,
      "mean_norm/layer0": 51.104164123535156,
      "multicode_k": 1,
      "output_norm": 11.512675134340917,
      "output_norm/layer0": 11.512675134340917,
      "step": 3150
    },
    {
      "MSE": 692.5095411173497,
      "MSE/layer0": 692.5095411173497,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.33,
      "input_norm": 31.997909634908044,
      "input_norm/layer0": 31.997909634908044,
      "learning_rate": 0.0003578947368421053,
      "loss": 2.0455,
      "max_norm": 59.2867546081543,
      "max_norm/layer0": 59.2867546081543,
      "mean_norm": 51.39415168762207,
      "mean_norm/layer0": 51.39415168762207,
      "multicode_k": 1,
      "output_norm": 11.587491785685224,
      "output_norm/layer0": 11.587491785685224,
      "step": 3200
    },
    {
      "MSE": 691.1425885009767,
      "MSE/layer0": 691.1425885009767,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.34,
      "input_norm": 31.99791768709818,
      "input_norm/layer0": 31.99791768709818,
      "learning_rate": 0.00035526315789473687,
      "loss": 2.0348,
      "max_norm": 59.64825439453125,
      "max_norm/layer0": 59.64825439453125,
      "mean_norm": 51.68109130859375,
      "mean_norm/layer0": 51.68109130859375,
      "multicode_k": 1,
      "output_norm": 11.643148959477745,
      "output_norm/layer0": 11.643148959477745,
      "step": 3250
    },
    {
      "MSE": 689.2906094360355,
      "MSE/layer0": 689.2906094360355,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.34,
      "input_norm": 31.997913980483997,
      "input_norm/layer0": 31.997913980483997,
      "learning_rate": 0.0003526315789473684,
      "loss": 2.0293,
      "max_norm": 59.97624206542969,
      "max_norm/layer0": 59.97624206542969,
      "mean_norm": 51.965484619140625,
      "mean_norm/layer0": 51.965484619140625,
      "multicode_k": 1,
      "output_norm": 11.714975148836775,
      "output_norm/layer0": 11.714975148836775,
      "step": 3300
    },
    {
      "MSE": 688.0525922648112,
      "MSE/layer0": 688.0525922648112,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.35,
      "input_norm": 31.997908350626624,
      "input_norm/layer0": 31.997908350626624,
      "learning_rate": 0.00035,
      "loss": 2.0389,
      "max_norm": 60.30556869506836,
      "max_norm/layer0": 60.30556869506836,
      "mean_norm": 52.2458438873291,
      "mean_norm/layer0": 52.2458438873291,
      "multicode_k": 1,
      "output_norm": 11.772027517954506,
      "output_norm/layer0": 11.772027517954506,
      "step": 3350
    },
    {
      "MSE": 686.4814953613279,
      "MSE/layer0": 686.4814953613279,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.35,
      "input_norm": 31.997902415593472,
      "input_norm/layer0": 31.997902415593472,
      "learning_rate": 0.0003473684210526316,
      "loss": 2.0266,
      "max_norm": 60.628334045410156,
      "max_norm/layer0": 60.628334045410156,
      "mean_norm": 52.522024154663086,
      "mean_norm/layer0": 52.522024154663086,
      "multicode_k": 1,
      "output_norm": 11.842156640688584,
      "output_norm/layer0": 11.842156640688584,
      "step": 3400
    },
    {
      "MSE": 684.6515231323242,
      "MSE/layer0": 684.6515231323242,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.36,
      "input_norm": 31.99791290283203,
      "input_norm/layer0": 31.99791290283203,
      "learning_rate": 0.0003447368421052632,
      "loss": 2.0248,
      "max_norm": 60.95072555541992,
      "max_norm/layer0": 60.95072555541992,
      "mean_norm": 52.79400825500488,
      "mean_norm/layer0": 52.79400825500488,
      "multicode_k": 1,
      "output_norm": 11.907371897697445,
      "output_norm/layer0": 11.907371897697445,
      "step": 3450
    },
    {
      "MSE": 683.5430062866212,
      "MSE/layer0": 683.5430062866212,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.37,
      "input_norm": 31.9979167175293,
      "input_norm/layer0": 31.9979167175293,
      "learning_rate": 0.00034210526315789477,
      "loss": 2.0263,
      "max_norm": 61.270816802978516,
      "max_norm/layer0": 61.270816802978516,
      "mean_norm": 53.06429481506348,
      "mean_norm/layer0": 53.06429481506348,
      "multicode_k": 1,
      "output_norm": 11.956860675811765,
      "output_norm/layer0": 11.956860675811765,
      "step": 3500
    },
    {
      "epoch": 0.37,
      "eval_MSE/layer0": 682.2680427869782,
      "eval_accuracy": 0.5224062440993215,
      "eval_dead_code_fraction/layer0": 0.0,
      "eval_input_norm/layer0": 31.997916449774355,
      "eval_loss": 2.0253396034240723,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 12.010468493388789,
      "eval_runtime": 73.2716,
      "eval_samples_per_second": 63.094,
      "eval_steps_per_second": 7.888,
      "step": 3500
    },
    {
      "MSE": 682.0599540201822,
      "MSE/layer0": 682.0599540201822,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.37,
      "input_norm": 31.9979091612498,
      "input_norm/layer0": 31.9979091612498,
      "learning_rate": 0.0003394736842105263,
      "loss": 2.035,
      "max_norm": 61.60363006591797,
      "max_norm/layer0": 61.60363006591797,
      "mean_norm": 53.33056831359863,
      "mean_norm/layer0": 53.33056831359863,
      "multicode_k": 1,
      "output_norm": 12.018342121442167,
      "output_norm/layer0": 12.018342121442167,
      "step": 3550
    },
    {
      "MSE": 680.5750654093424,
      "MSE/layer0": 680.5750654093424,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.38,
      "input_norm": 31.997909587224328,
      "input_norm/layer0": 31.997909587224328,
      "learning_rate": 0.0003368421052631579,
      "loss": 2.0232,
      "max_norm": 61.922420501708984,
      "max_norm/layer0": 61.922420501708984,
      "mean_norm": 53.59366035461426,
      "mean_norm/layer0": 53.59366035461426,
      "multicode_k": 1,
      "output_norm": 12.078021968205773,
      "output_norm/layer0": 12.078021968205773,
      "step": 3600
    },
    {
      "MSE": 678.8478289794925,
      "MSE/layer0": 678.8478289794925,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.38,
      "input_norm": 31.99789888381958,
      "input_norm/layer0": 31.99789888381958,
      "learning_rate": 0.00033421052631578944,
      "loss": 2.0171,
      "max_norm": 62.24449157714844,
      "max_norm/layer0": 62.24449157714844,
      "mean_norm": 53.85357475280762,
      "mean_norm/layer0": 53.85357475280762,
      "multicode_k": 1,
      "output_norm": 12.149001522064214,
      "output_norm/layer0": 12.149001522064214,
      "step": 3650
    },
    {
      "MSE": 677.7631386311848,
      "MSE/layer0": 677.7631386311848,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.39,
      "input_norm": 31.997902571360274,
      "input_norm/layer0": 31.997902571360274,
      "learning_rate": 0.00033157894736842103,
      "loss": 2.0212,
      "max_norm": 62.564937591552734,
      "max_norm/layer0": 62.564937591552734,
      "mean_norm": 54.10923385620117,
      "mean_norm/layer0": 54.10923385620117,
      "multicode_k": 1,
      "output_norm": 12.200160818099977,
      "output_norm/layer0": 12.200160818099977,
      "step": 3700
    },
    {
      "MSE": 676.4079176839191,
      "MSE/layer0": 676.4079176839191,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.39,
      "input_norm": 31.99789404869079,
      "input_norm/layer0": 31.99789404869079,
      "learning_rate": 0.0003289473684210527,
      "loss": 2.0184,
      "max_norm": 62.88063430786133,
      "max_norm/layer0": 62.88063430786133,
      "mean_norm": 54.362863540649414,
      "mean_norm/layer0": 54.362863540649414,
      "multicode_k": 1,
      "output_norm": 12.259288868904115,
      "output_norm/layer0": 12.259288868904115,
      "step": 3750
    },
    {
      "MSE": 675.2395422363282,
      "MSE/layer0": 675.2395422363282,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.4,
      "input_norm": 31.99789286295573,
      "input_norm/layer0": 31.99789286295573,
      "learning_rate": 0.0003263157894736842,
      "loss": 2.0058,
      "max_norm": 63.18323516845703,
      "max_norm/layer0": 63.18323516845703,
      "mean_norm": 54.61160659790039,
      "mean_norm/layer0": 54.61160659790039,
      "multicode_k": 1,
      "output_norm": 12.305311093330385,
      "output_norm/layer0": 12.305311093330385,
      "step": 3800
    },
    {
      "MSE": 673.5289611816404,
      "MSE/layer0": 673.5289611816404,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.4,
      "input_norm": 31.997895905176787,
      "input_norm/layer0": 31.997895905176787,
      "learning_rate": 0.0003236842105263158,
      "loss": 2.0147,
      "max_norm": 63.47829055786133,
      "max_norm/layer0": 63.47829055786133,
      "mean_norm": 54.85733413696289,
      "mean_norm/layer0": 54.85733413696289,
      "multicode_k": 1,
      "output_norm": 12.368880640665692,
      "output_norm/layer0": 12.368880640665692,
      "step": 3850
    },
    {
      "MSE": 672.7262348429363,
      "MSE/layer0": 672.7262348429363,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.41,
      "input_norm": 31.997892808914187,
      "input_norm/layer0": 31.997892808914187,
      "learning_rate": 0.0003210526315789474,
      "loss": 2.0011,
      "max_norm": 63.7920036315918,
      "max_norm/layer0": 63.7920036315918,
      "mean_norm": 55.099992752075195,
      "mean_norm/layer0": 55.099992752075195,
      "multicode_k": 1,
      "output_norm": 12.413625540733335,
      "output_norm/layer0": 12.413625540733335,
      "step": 3900
    },
    {
      "MSE": 671.2364042154949,
      "MSE/layer0": 671.2364042154949,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.41,
      "input_norm": 31.997892484664916,
      "input_norm/layer0": 31.997892484664916,
      "learning_rate": 0.00031842105263157894,
      "loss": 2.0068,
      "max_norm": 64.07488250732422,
      "max_norm/layer0": 64.07488250732422,
      "mean_norm": 55.33942985534668,
      "mean_norm/layer0": 55.33942985534668,
      "multicode_k": 1,
      "output_norm": 12.478335504531861,
      "output_norm/layer0": 12.478335504531861,
      "step": 3950
    },
    {
      "MSE": 669.9738427734378,
      "MSE/layer0": 669.9738427734378,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.42,
      "input_norm": 31.997889916102086,
      "input_norm/layer0": 31.997889916102086,
      "learning_rate": 0.00031578947368421053,
      "loss": 1.9906,
      "max_norm": 64.34879302978516,
      "max_norm/layer0": 64.34879302978516,
      "mean_norm": 55.576541900634766,
      "mean_norm/layer0": 55.576541900634766,
      "multicode_k": 1,
      "output_norm": 12.524646544456482,
      "output_norm/layer0": 12.524646544456482,
      "step": 4000
    },
    {
      "epoch": 0.42,
      "eval_MSE/layer0": 669.1965223770751,
      "eval_accuracy": 0.5253332978103237,
      "eval_dead_code_fraction/layer0": 0.0,
      "eval_input_norm/layer0": 31.997898890449704,
      "eval_loss": 2.006638526916504,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 12.556819209953474,
      "eval_runtime": 73.3751,
      "eval_samples_per_second": 63.005,
      "eval_steps_per_second": 7.877,
      "step": 4000
    },
    {
      "MSE": 668.3390091959637,
      "MSE/layer0": 668.3390091959637,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.42,
      "input_norm": 31.99788640658062,
      "input_norm/layer0": 31.99788640658062,
      "learning_rate": 0.00031315789473684207,
      "loss": 1.9962,
      "max_norm": 64.65262603759766,
      "max_norm/layer0": 64.65262603759766,
      "mean_norm": 55.811140060424805,
      "mean_norm/layer0": 55.811140060424805,
      "multicode_k": 1,
      "output_norm": 12.584023051261894,
      "output_norm/layer0": 12.584023051261894,
      "step": 4050
    },
    {
      "MSE": 667.4144735717773,
      "MSE/layer0": 667.4144735717773,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.43,
      "input_norm": 31.99788414637247,
      "input_norm/layer0": 31.99788414637247,
      "learning_rate": 0.0003105263157894737,
      "loss": 2.0038,
      "max_norm": 64.9332275390625,
      "max_norm/layer0": 64.9332275390625,
      "mean_norm": 56.04119682312012,
      "mean_norm/layer0": 56.04119682312012,
      "multicode_k": 1,
      "output_norm": 12.633416105906175,
      "output_norm/layer0": 12.633416105906175,
      "step": 4100
    },
    {
      "MSE": 666.502211812337,
      "MSE/layer0": 666.502211812337,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.43,
      "input_norm": 31.997885338465373,
      "input_norm/layer0": 31.997885338465373,
      "learning_rate": 0.0003078947368421053,
      "loss": 2.0046,
      "max_norm": 65.20265197753906,
      "max_norm/layer0": 65.20265197753906,
      "mean_norm": 56.26777458190918,
      "mean_norm/layer0": 56.26777458190918,
      "multicode_k": 1,
      "output_norm": 12.67455391089122,
      "output_norm/layer0": 12.67455391089122,
      "step": 4150
    },
    {
      "MSE": 665.0832258097332,
      "MSE/layer0": 665.0832258097332,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.44,
      "input_norm": 31.997875661849967,
      "input_norm/layer0": 31.997875661849967,
      "learning_rate": 0.00030526315789473684,
      "loss": 2.0066,
      "max_norm": 65.46887969970703,
      "max_norm/layer0": 65.46887969970703,
      "mean_norm": 56.49208450317383,
      "mean_norm/layer0": 56.49208450317383,
      "multicode_k": 1,
      "output_norm": 12.73067569255829,
      "output_norm/layer0": 12.73067569255829,
      "step": 4200
    },
    {
      "MSE": 663.9124774169925,
      "MSE/layer0": 663.9124774169925,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.44,
      "input_norm": 31.997874129613244,
      "input_norm/layer0": 31.997874129613244,
      "learning_rate": 0.00030263157894736844,
      "loss": 2.0006,
      "max_norm": 65.73078918457031,
      "max_norm/layer0": 65.73078918457031,
      "mean_norm": 56.712989807128906,
      "mean_norm/layer0": 56.712989807128906,
      "multicode_k": 1,
      "output_norm": 12.783326719601945,
      "output_norm/layer0": 12.783326719601945,
      "step": 4250
    },
    {
      "MSE": 663.0191631062823,
      "MSE/layer0": 663.0191631062823,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.45,
      "input_norm": 31.99787082672119,
      "input_norm/layer0": 31.99787082672119,
      "learning_rate": 0.0003,
      "loss": 1.9862,
      "max_norm": 65.99481964111328,
      "max_norm/layer0": 65.99481964111328,
      "mean_norm": 56.93141746520996,
      "mean_norm/layer0": 56.93141746520996,
      "multicode_k": 1,
      "output_norm": 12.824343484242757,
      "output_norm/layer0": 12.824343484242757,
      "step": 4300
    },
    {
      "MSE": 661.9175501505531,
      "MSE/layer0": 661.9175501505531,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.45,
      "input_norm": 31.997863101959226,
      "input_norm/layer0": 31.997863101959226,
      "learning_rate": 0.00029736842105263157,
      "loss": 1.9891,
      "max_norm": 66.25289916992188,
      "max_norm/layer0": 66.25289916992188,
      "mean_norm": 57.14705848693848,
      "mean_norm/layer0": 57.14705848693848,
      "multicode_k": 1,
      "output_norm": 12.873331023852028,
      "output_norm/layer0": 12.873331023852028,
      "step": 4350
    },
    {
      "MSE": 660.8278486124677,
      "MSE/layer0": 660.8278486124677,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.46,
      "input_norm": 31.99786113739014,
      "input_norm/layer0": 31.99786113739014,
      "learning_rate": 0.00029473684210526316,
      "loss": 1.9874,
      "max_norm": 66.49950408935547,
      "max_norm/layer0": 66.49950408935547,
      "mean_norm": 57.3592414855957,
      "mean_norm/layer0": 57.3592414855957,
      "multicode_k": 1,
      "output_norm": 12.925755645434062,
      "output_norm/layer0": 12.925755645434062,
      "step": 4400
    },
    {
      "MSE": 659.7812182617188,
      "MSE/layer0": 659.7812182617188,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.46,
      "input_norm": 31.997859818140668,
      "input_norm/layer0": 31.997859818140668,
      "learning_rate": 0.00029210526315789475,
      "loss": 1.9894,
      "max_norm": 66.74647521972656,
      "max_norm/layer0": 66.74647521972656,
      "mean_norm": 57.56860542297363,
      "mean_norm/layer0": 57.56860542297363,
      "multicode_k": 1,
      "output_norm": 12.969949612617494,
      "output_norm/layer0": 12.969949612617494,
      "step": 4450
    },
    {
      "MSE": 658.2862462361654,
      "MSE/layer0": 658.2862462361654,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.47,
      "input_norm": 31.997855517069482,
      "input_norm/layer0": 31.997855517069482,
      "learning_rate": 0.00028947368421052634,
      "loss": 1.9852,
      "max_norm": 67.0057373046875,
      "max_norm/layer0": 67.0057373046875,
      "mean_norm": 57.77582931518555,
      "mean_norm/layer0": 57.77582931518555,
      "multicode_k": 1,
      "output_norm": 13.019407332738238,
      "output_norm/layer0": 13.019407332738238,
      "step": 4500
    },
    {
      "epoch": 0.47,
      "eval_MSE/layer0": 657.5871718611108,
      "eval_accuracy": 0.5279040641917702,
      "eval_dead_code_fraction/layer0": 0.0,
      "eval_input_norm/layer0": 31.997854675071842,
      "eval_loss": 1.9898165464401245,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 13.052642994207561,
      "eval_runtime": 74.0479,
      "eval_samples_per_second": 62.433,
      "eval_steps_per_second": 7.806,
      "step": 4500
    },
    {
      "MSE": 657.2974259440105,
      "MSE/layer0": 657.2974259440105,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.48,
      "input_norm": 31.99785115559897,
      "input_norm/layer0": 31.99785115559897,
      "learning_rate": 0.0002868421052631579,
      "loss": 1.9727,
      "max_norm": 67.25566101074219,
      "max_norm/layer0": 67.25566101074219,
      "mean_norm": 57.98077964782715,
      "mean_norm/layer0": 57.98077964782715,
      "multicode_k": 1,
      "output_norm": 13.063522001902262,
      "output_norm/layer0": 13.063522001902262,
      "step": 4550
    },
    {
      "MSE": 656.5759895833334,
      "MSE/layer0": 656.5759895833334,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.48,
      "input_norm": 31.997858088811242,
      "input_norm/layer0": 31.997858088811242,
      "learning_rate": 0.00028421052631578947,
      "loss": 1.9897,
      "max_norm": 67.49605560302734,
      "max_norm/layer0": 67.49605560302734,
      "mean_norm": 58.182559967041016,
      "mean_norm/layer0": 58.182559967041016,
      "multicode_k": 1,
      "output_norm": 13.099744346936546,
      "output_norm/layer0": 13.099744346936546,
      "step": 4600
    },
    {
      "MSE": 655.8373800659178,
      "MSE/layer0": 655.8373800659178,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.49,
      "input_norm": 31.997857850392663,
      "input_norm/layer0": 31.997857850392663,
      "learning_rate": 0.00028157894736842106,
      "loss": 1.9918,
      "max_norm": 67.72962188720703,
      "max_norm/layer0": 67.72962188720703,
      "mean_norm": 58.38115119934082,
      "mean_norm/layer0": 58.38115119934082,
      "multicode_k": 1,
      "output_norm": 13.13247790972392,
      "output_norm/layer0": 13.13247790972392,
      "step": 4650
    },
    {
      "MSE": 654.6057424926755,
      "MSE/layer0": 654.6057424926755,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.49,
      "input_norm": 31.997855739593504,
      "input_norm/layer0": 31.997855739593504,
      "learning_rate": 0.0002789473684210526,
      "loss": 1.9908,
      "max_norm": 67.96855163574219,
      "max_norm/layer0": 67.96855163574219,
      "mean_norm": 58.57722091674805,
      "mean_norm/layer0": 58.57722091674805,
      "multicode_k": 1,
      "output_norm": 13.187800091107682,
      "output_norm/layer0": 13.187800091107682,
      "step": 4700
    },
    {
      "MSE": 653.7336292521161,
      "MSE/layer0": 653.7336292521161,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.5,
      "input_norm": 31.997861677805588,
      "input_norm/layer0": 31.997861677805588,
      "learning_rate": 0.00027631578947368425,
      "loss": 1.9919,
      "max_norm": 68.20356750488281,
      "max_norm/layer0": 68.20356750488281,
      "mean_norm": 58.77041053771973,
      "mean_norm/layer0": 58.77041053771973,
      "multicode_k": 1,
      "output_norm": 13.224705770810434,
      "output_norm/layer0": 13.224705770810434,
      "step": 4750
    },
    {
      "MSE": 652.4711893717447,
      "MSE/layer0": 652.4711893717447,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.5,
      "input_norm": 31.997852430343634,
      "input_norm/layer0": 31.997852430343634,
      "learning_rate": 0.00027368421052631584,
      "loss": 1.9777,
      "max_norm": 68.42557525634766,
      "max_norm/layer0": 68.42557525634766,
      "mean_norm": 58.96235466003418,
      "mean_norm/layer0": 58.96235466003418,
      "multicode_k": 1,
      "output_norm": 13.275700616836549,
      "output_norm/layer0": 13.275700616836549,
      "step": 4800
    },
    {
      "MSE": 651.660216674805,
      "MSE/layer0": 651.660216674805,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.51,
      "input_norm": 31.997857831319166,
      "input_norm/layer0": 31.997857831319166,
      "learning_rate": 0.0002710526315789474,
      "loss": 1.9728,
      "max_norm": 68.6562271118164,
      "max_norm/layer0": 68.6562271118164,
      "mean_norm": 59.151214599609375,
      "mean_norm/layer0": 59.151214599609375,
      "multicode_k": 1,
      "output_norm": 13.316913062731425,
      "output_norm/layer0": 13.316913062731425,
      "step": 4850
    },
    {
      "MSE": 651.1180463663741,
      "MSE/layer0": 651.1180463663741,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.51,
      "input_norm": 31.997851276397704,
      "input_norm/layer0": 31.997851276397704,
      "learning_rate": 0.00026842105263157897,
      "loss": 1.9806,
      "max_norm": 68.8842544555664,
      "max_norm/layer0": 68.8842544555664,
      "mean_norm": 59.336891174316406,
      "mean_norm/layer0": 59.336891174316406,
      "multicode_k": 1,
      "output_norm": 13.348248120943708,
      "output_norm/layer0": 13.348248120943708,
      "step": 4900
    },
    {
      "MSE": 650.0774853515621,
      "MSE/layer0": 650.0774853515621,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.52,
      "input_norm": 31.997846142450957,
      "input_norm/layer0": 31.997846142450957,
      "learning_rate": 0.0002657894736842105,
      "loss": 1.9718,
      "max_norm": 69.09481811523438,
      "max_norm/layer0": 69.09481811523438,
      "mean_norm": 59.52014923095703,
      "mean_norm/layer0": 59.52014923095703,
      "multicode_k": 1,
      "output_norm": 13.38570951779683,
      "output_norm/layer0": 13.38570951779683,
      "step": 4950
    },
    {
      "MSE": 649.2541728719073,
      "MSE/layer0": 649.2541728719073,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.52,
      "input_norm": 31.997852964401247,
      "input_norm/layer0": 31.997852964401247,
      "learning_rate": 0.0002631578947368421,
      "loss": 1.9687,
      "max_norm": 69.3100357055664,
      "max_norm/layer0": 69.3100357055664,
      "mean_norm": 59.70068359375,
      "mean_norm/layer0": 59.70068359375,
      "multicode_k": 1,
      "output_norm": 13.423000381787617,
      "output_norm/layer0": 13.423000381787617,
      "step": 5000
    },
    {
      "epoch": 0.52,
      "eval_MSE/layer0": 648.246248562512,
      "eval_accuracy": 0.5299863891896716,
      "eval_dead_code_fraction/layer0": 0.0,
      "eval_input_norm/layer0": 31.997853133679993,
      "eval_loss": 1.975706934928894,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 13.449585199510798,
      "eval_runtime": 73.7352,
      "eval_samples_per_second": 62.697,
      "eval_steps_per_second": 7.839,
      "step": 5000
    },
    {
      "MSE": 648.4500269571938,
      "MSE/layer0": 648.4500269571938,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.53,
      "input_norm": 31.99784724235535,
      "input_norm/layer0": 31.99784724235535,
      "learning_rate": 0.0002605263157894737,
      "loss": 1.9816,
      "max_norm": 69.5140151977539,
      "max_norm/layer0": 69.5140151977539,
      "mean_norm": 59.87860107421875,
      "mean_norm/layer0": 59.87860107421875,
      "multicode_k": 1,
      "output_norm": 13.459953915278113,
      "output_norm/layer0": 13.459953915278113,
      "step": 5050
    },
    {
      "MSE": 647.5120207722985,
      "MSE/layer0": 647.5120207722985,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.53,
      "input_norm": 31.997845083872484,
      "input_norm/layer0": 31.997845083872484,
      "learning_rate": 0.0002578947368421053,
      "loss": 1.9778,
      "max_norm": 69.72222137451172,
      "max_norm/layer0": 69.72222137451172,
      "mean_norm": 60.054636001586914,
      "mean_norm/layer0": 60.054636001586914,
      "multicode_k": 1,
      "output_norm": 13.495457221666976,
      "output_norm/layer0": 13.495457221666976,
      "step": 5100
    },
    {
      "MSE": 646.8909526570638,
      "MSE/layer0": 646.8909526570638,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.54,
      "input_norm": 31.99783927281696,
      "input_norm/layer0": 31.99783927281696,
      "learning_rate": 0.0002552631578947369,
      "loss": 1.9608,
      "max_norm": 69.93621826171875,
      "max_norm/layer0": 69.93621826171875,
      "mean_norm": 60.228532791137695,
      "mean_norm/layer0": 60.228532791137695,
      "multicode_k": 1,
      "output_norm": 13.523821023305253,
      "output_norm/layer0": 13.523821023305253,
      "step": 5150
    },
    {
      "MSE": 645.6001059977214,
      "MSE/layer0": 645.6001059977214,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.54,
      "input_norm": 31.997829329172767,
      "input_norm/layer0": 31.997829329172767,
      "learning_rate": 0.0002526315789473684,
      "loss": 1.9514,
      "max_norm": 70.1629867553711,
      "max_norm/layer0": 70.1629867553711,
      "mean_norm": 60.39993667602539,
      "mean_norm/layer0": 60.39993667602539,
      "multicode_k": 1,
      "output_norm": 13.575601536432904,
      "output_norm/layer0": 13.575601536432904,
      "step": 5200
    },
    {
      "MSE": 645.0477313232423,
      "MSE/layer0": 645.0477313232423,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.55,
      "input_norm": 31.997829844156904,
      "input_norm/layer0": 31.997829844156904,
      "learning_rate": 0.00025,
      "loss": 1.953,
      "max_norm": 70.36659240722656,
      "max_norm/layer0": 70.36659240722656,
      "mean_norm": 60.568695068359375,
      "mean_norm/layer0": 60.568695068359375,
      "multicode_k": 1,
      "output_norm": 13.606370126406352,
      "output_norm/layer0": 13.606370126406352,
      "step": 5250
    },
    {
      "MSE": 644.0795441691082,
      "MSE/layer0": 644.0795441691082,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.55,
      "input_norm": 31.997827720642086,
      "input_norm/layer0": 31.997827720642086,
      "learning_rate": 0.0002473684210526316,
      "loss": 1.9664,
      "max_norm": 70.58203125,
      "max_norm/layer0": 70.58203125,
      "mean_norm": 60.73503303527832,
      "mean_norm/layer0": 60.73503303527832,
      "multicode_k": 1,
      "output_norm": 13.644356350898736,
      "output_norm/layer0": 13.644356350898736,
      "step": 5300
    },
    {
      "MSE": 643.4398297119142,
      "MSE/layer0": 643.4398297119142,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.56,
      "input_norm": 31.99783255259196,
      "input_norm/layer0": 31.99783255259196,
      "learning_rate": 0.0002447368421052632,
      "loss": 1.9612,
      "max_norm": 70.80116271972656,
      "max_norm/layer0": 70.80116271972656,
      "mean_norm": 60.89903450012207,
      "mean_norm/layer0": 60.89903450012207,
      "multicode_k": 1,
      "output_norm": 13.676611545880633,
      "output_norm/layer0": 13.676611545880633,
      "step": 5350
    },
    {
      "MSE": 642.6565199788413,
      "MSE/layer0": 642.6565199788413,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.56,
      "input_norm": 31.997826932271334,
      "input_norm/layer0": 31.997826932271334,
      "learning_rate": 0.00024210526315789475,
      "loss": 1.9695,
      "max_norm": 71.0198745727539,
      "max_norm/layer0": 71.0198745727539,
      "mean_norm": 61.06051063537598,
      "mean_norm/layer0": 61.06051063537598,
      "multicode_k": 1,
      "output_norm": 13.705395914713542,
      "output_norm/layer0": 13.705395914713542,
      "step": 5400
    },
    {
      "MSE": 641.5518863932293,
      "MSE/layer0": 641.5518863932293,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.57,
      "input_norm": 31.99782320658366,
      "input_norm/layer0": 31.99782320658366,
      "learning_rate": 0.00023947368421052632,
      "loss": 1.9708,
      "max_norm": 71.22209930419922,
      "max_norm/layer0": 71.22209930419922,
      "mean_norm": 61.22001647949219,
      "mean_norm/layer0": 61.22001647949219,
      "multicode_k": 1,
      "output_norm": 13.747722525596622,
      "output_norm/layer0": 13.747722525596622,
      "step": 5450
    },
    {
      "MSE": 641.0277577718095,
      "MSE/layer0": 641.0277577718095,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.57,
      "input_norm": 31.997817249298095,
      "input_norm/layer0": 31.997817249298095,
      "learning_rate": 0.00023684210526315788,
      "loss": 1.9672,
      "max_norm": 71.42549896240234,
      "max_norm/layer0": 71.42549896240234,
      "mean_norm": 61.377342224121094,
      "mean_norm/layer0": 61.377342224121094,
      "multicode_k": 1,
      "output_norm": 13.775313488642375,
      "output_norm/layer0": 13.775313488642375,
      "step": 5500
    },
    {
      "epoch": 0.57,
      "eval_MSE/layer0": 640.0821653411886,
      "eval_accuracy": 0.5321348969378108,
      "eval_dead_code_fraction/layer0": 0.0,
      "eval_input_norm/layer0": 31.997811444105338,
      "eval_loss": 1.9619895219802856,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 13.80778875099279,
      "eval_runtime": 73.8101,
      "eval_samples_per_second": 62.634,
      "eval_steps_per_second": 7.831,
      "step": 5500
    },
    {
      "MSE": 640.2260070800783,
      "MSE/layer0": 640.2260070800783,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.58,
      "input_norm": 31.997807060877484,
      "input_norm/layer0": 31.997807060877484,
      "learning_rate": 0.00023421052631578948,
      "loss": 1.9526,
      "max_norm": 71.6324691772461,
      "max_norm/layer0": 71.6324691772461,
      "mean_norm": 61.532691955566406,
      "mean_norm/layer0": 61.532691955566406,
      "multicode_k": 1,
      "output_norm": 13.81434581597646,
      "output_norm/layer0": 13.81434581597646,
      "step": 5550
    },
    {
      "MSE": 639.6603690592448,
      "MSE/layer0": 639.6603690592448,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.58,
      "input_norm": 31.997815796534205,
      "input_norm/layer0": 31.997815796534205,
      "learning_rate": 0.00023157894736842107,
      "loss": 1.9592,
      "max_norm": 71.83050537109375,
      "max_norm/layer0": 71.83050537109375,
      "mean_norm": 61.68556213378906,
      "mean_norm/layer0": 61.68556213378906,
      "multicode_k": 1,
      "output_norm": 13.843803273836771,
      "output_norm/layer0": 13.843803273836771,
      "step": 5600
    },
    {
      "MSE": 638.8630006917316,
      "MSE/layer0": 638.8630006917316,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.59,
      "input_norm": 31.997804651260374,
      "input_norm/layer0": 31.997804651260374,
      "learning_rate": 0.00022894736842105263,
      "loss": 1.9582,
      "max_norm": 72.0186767578125,
      "max_norm/layer0": 72.0186767578125,
      "mean_norm": 61.836381912231445,
      "mean_norm/layer0": 61.836381912231445,
      "multicode_k": 1,
      "output_norm": 13.87206829547882,
      "output_norm/layer0": 13.87206829547882,
      "step": 5650
    },
    {
      "MSE": 638.6114538574218,
      "MSE/layer0": 638.6114538574218,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.6,
      "input_norm": 31.997799615859993,
      "input_norm/layer0": 31.997799615859993,
      "learning_rate": 0.00022631578947368422,
      "loss": 1.9581,
      "max_norm": 72.212158203125,
      "max_norm/layer0": 72.212158203125,
      "mean_norm": 61.984375,
      "mean_norm/layer0": 61.984375,
      "multicode_k": 1,
      "output_norm": 13.890618721644087,
      "output_norm/layer0": 13.890618721644087,
      "step": 5700
    },
    {
      "MSE": 637.4200433349613,
      "MSE/layer0": 637.4200433349613,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.6,
      "input_norm": 31.9977961031596,
      "input_norm/layer0": 31.9977961031596,
      "learning_rate": 0.0002236842105263158,
      "loss": 1.9563,
      "max_norm": 72.40010833740234,
      "max_norm/layer0": 72.40010833740234,
      "mean_norm": 62.13043212890625,
      "mean_norm/layer0": 62.13043212890625,
      "multicode_k": 1,
      "output_norm": 13.935336654980983,
      "output_norm/layer0": 13.935336654980983,
      "step": 5750
    },
    {
      "MSE": 636.9881141153974,
      "MSE/layer0": 636.9881141153974,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.61,
      "input_norm": 31.997795972824097,
      "input_norm/layer0": 31.997795972824097,
      "learning_rate": 0.00022105263157894735,
      "loss": 1.9652,
      "max_norm": 72.58822631835938,
      "max_norm/layer0": 72.58822631835938,
      "mean_norm": 62.274553298950195,
      "mean_norm/layer0": 62.274553298950195,
      "multicode_k": 1,
      "output_norm": 13.960987841288247,
      "output_norm/layer0": 13.960987841288247,
      "step": 5800
    },
    {
      "MSE": 636.22215037028,
      "MSE/layer0": 636.22215037028,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.61,
      "input_norm": 31.997794774373368,
      "input_norm/layer0": 31.997794774373368,
      "learning_rate": 0.00021842105263157897,
      "loss": 1.9509,
      "max_norm": 72.77027130126953,
      "max_norm/layer0": 72.77027130126953,
      "mean_norm": 62.417043685913086,
      "mean_norm/layer0": 62.417043685913086,
      "multicode_k": 1,
      "output_norm": 13.98557560602824,
      "output_norm/layer0": 13.98557560602824,
      "step": 5850
    },
    {
      "MSE": 635.6220120239254,
      "MSE/layer0": 635.6220120239254,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.62,
      "input_norm": 31.997796500523897,
      "input_norm/layer0": 31.997796500523897,
      "learning_rate": 0.00021578947368421054,
      "loss": 1.9637,
      "max_norm": 72.93942260742188,
      "max_norm/layer0": 72.93942260742188,
      "mean_norm": 62.5573787689209,
      "mean_norm/layer0": 62.5573787689209,
      "multicode_k": 1,
      "output_norm": 14.011822309494022,
      "output_norm/layer0": 14.011822309494022,
      "step": 5900
    },
    {
      "MSE": 635.1990796915693,
      "MSE/layer0": 635.1990796915693,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.62,
      "input_norm": 31.99778350830077,
      "input_norm/layer0": 31.99778350830077,
      "learning_rate": 0.0002131578947368421,
      "loss": 1.9417,
      "max_norm": 73.11217498779297,
      "max_norm/layer0": 73.11217498779297,
      "mean_norm": 62.69554328918457,
      "mean_norm/layer0": 62.69554328918457,
      "multicode_k": 1,
      "output_norm": 14.040199557940166,
      "output_norm/layer0": 14.040199557940166,
      "step": 5950
    },
    {
      "MSE": 634.617561645508,
      "MSE/layer0": 634.617561645508,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.63,
      "input_norm": 31.9977766195933,
      "input_norm/layer0": 31.9977766195933,
      "learning_rate": 0.00021052631578947367,
      "loss": 1.9441,
      "max_norm": 73.27617645263672,
      "max_norm/layer0": 73.27617645263672,
      "mean_norm": 62.831491470336914,
      "mean_norm/layer0": 62.831491470336914,
      "multicode_k": 1,
      "output_norm": 14.065582130750016,
      "output_norm/layer0": 14.065582130750016,
      "step": 6000
    },
    {
      "epoch": 0.63,
      "eval_MSE/layer0": 633.8831350106634,
      "eval_accuracy": 0.5338761587531762,
      "eval_dead_code_fraction/layer0": 0.0,
      "eval_input_norm/layer0": 31.997772803689244,
      "eval_loss": 1.951315999031067,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 14.101806794000915,
      "eval_runtime": 73.5977,
      "eval_samples_per_second": 62.814,
      "eval_steps_per_second": 7.854,
      "step": 6000
    },
    {
      "MSE": 633.8391249593099,
      "MSE/layer0": 633.8391249593099,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.63,
      "input_norm": 31.99777683258057,
      "input_norm/layer0": 31.99777683258057,
      "learning_rate": 0.0002078947368421053,
      "loss": 1.9507,
      "max_norm": 73.43240356445312,
      "max_norm/layer0": 73.43240356445312,
      "mean_norm": 62.96537971496582,
      "mean_norm/layer0": 62.96537971496582,
      "multicode_k": 1,
      "output_norm": 14.0993266805013,
      "output_norm/layer0": 14.0993266805013,
      "step": 6050
    },
    {
      "MSE": 633.1878758748373,
      "MSE/layer0": 633.1878758748373,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.64,
      "input_norm": 31.997768185933438,
      "input_norm/layer0": 31.997768185933438,
      "learning_rate": 0.00020526315789473685,
      "loss": 1.9535,
      "max_norm": 73.59780883789062,
      "max_norm/layer0": 73.59780883789062,
      "mean_norm": 63.09744453430176,
      "mean_norm/layer0": 63.09744453430176,
      "multicode_k": 1,
      "output_norm": 14.12703340212504,
      "output_norm/layer0": 14.12703340212504,
      "step": 6100
    },
    {
      "MSE": 632.4774736531577,
      "MSE/layer0": 632.4774736531577,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.64,
      "input_norm": 31.997762225468954,
      "input_norm/layer0": 31.997762225468954,
      "learning_rate": 0.00020263157894736842,
      "loss": 1.9502,
      "max_norm": 73.7634506225586,
      "max_norm/layer0": 73.7634506225586,
      "mean_norm": 63.227373123168945,
      "mean_norm/layer0": 63.227373123168945,
      "multicode_k": 1,
      "output_norm": 14.155767776171366,
      "output_norm/layer0": 14.155767776171366,
      "step": 6150
    },
    {
      "MSE": 632.0819724527997,
      "MSE/layer0": 632.0819724527997,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.65,
      "input_norm": 31.997758595148735,
      "input_norm/layer0": 31.997758595148735,
      "learning_rate": 0.0002,
      "loss": 1.948,
      "max_norm": 73.93152618408203,
      "max_norm/layer0": 73.93152618408203,
      "mean_norm": 63.35538673400879,
      "mean_norm/layer0": 63.35538673400879,
      "multicode_k": 1,
      "output_norm": 14.17972202301026,
      "output_norm/layer0": 14.17972202301026,
      "step": 6200
    },
    {
      "MSE": 631.3937511189779,
      "MSE/layer0": 631.3937511189779,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.65,
      "input_norm": 31.997760909398387,
      "input_norm/layer0": 31.997760909398387,
      "learning_rate": 0.00019736842105263157,
      "loss": 1.9449,
      "max_norm": 74.07744598388672,
      "max_norm/layer0": 74.07744598388672,
      "mean_norm": 63.481435775756836,
      "mean_norm/layer0": 63.481435775756836,
      "multicode_k": 1,
      "output_norm": 14.207703741391498,
      "output_norm/layer0": 14.207703741391498,
      "step": 6250
    },
    {
      "MSE": 631.1097898356121,
      "MSE/layer0": 631.1097898356121,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.66,
      "input_norm": 31.997752253214514,
      "input_norm/layer0": 31.997752253214514,
      "learning_rate": 0.00019473684210526317,
      "loss": 1.9256,
      "max_norm": 74.23124694824219,
      "max_norm/layer0": 74.23124694824219,
      "mean_norm": 63.605464935302734,
      "mean_norm/layer0": 63.605464935302734,
      "multicode_k": 1,
      "output_norm": 14.22562705675761,
      "output_norm/layer0": 14.22562705675761,
      "step": 6300
    },
    {
      "MSE": 630.4715811157231,
      "MSE/layer0": 630.4715811157231,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.66,
      "input_norm": 31.99775326093037,
      "input_norm/layer0": 31.99775326093037,
      "learning_rate": 0.00019210526315789473,
      "loss": 1.9394,
      "max_norm": 74.37789154052734,
      "max_norm/layer0": 74.37789154052734,
      "mean_norm": 63.72765922546387,
      "mean_norm/layer0": 63.72765922546387,
      "multicode_k": 1,
      "output_norm": 14.252348532676702,
      "output_norm/layer0": 14.252348532676702,
      "step": 6350
    },
    {
      "MSE": 629.5616383870444,
      "MSE/layer0": 629.5616383870444,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.67,
      "input_norm": 31.9977592086792,
      "input_norm/layer0": 31.9977592086792,
      "learning_rate": 0.00018947368421052632,
      "loss": 1.948,
      "max_norm": 74.52799987792969,
      "max_norm/layer0": 74.52799987792969,
      "mean_norm": 63.84817886352539,
      "mean_norm/layer0": 63.84817886352539,
      "multicode_k": 1,
      "output_norm": 14.278619543711342,
      "output_norm/layer0": 14.278619543711342,
      "step": 6400
    },
    {
      "MSE": 628.9405068969726,
      "MSE/layer0": 628.9405068969726,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.67,
      "input_norm": 31.9977388159434,
      "input_norm/layer0": 31.9977388159434,
      "learning_rate": 0.0001868421052631579,
      "loss": 1.9365,
      "max_norm": 74.66854095458984,
      "max_norm/layer0": 74.66854095458984,
      "mean_norm": 63.96674346923828,
      "mean_norm/layer0": 63.96674346923828,
      "multicode_k": 1,
      "output_norm": 14.308290360768634,
      "output_norm/layer0": 14.308290360768634,
      "step": 6450
    },
    {
      "MSE": 628.8358187866208,
      "MSE/layer0": 628.8358187866208,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.68,
      "input_norm": 31.997742996215806,
      "input_norm/layer0": 31.997742996215806,
      "learning_rate": 0.00018421052631578948,
      "loss": 1.9408,
      "max_norm": 74.80778503417969,
      "max_norm/layer0": 74.80778503417969,
      "mean_norm": 64.08341407775879,
      "mean_norm/layer0": 64.08341407775879,
      "multicode_k": 1,
      "output_norm": 14.319794411659238,
      "output_norm/layer0": 14.319794411659238,
      "step": 6500
    },
    {
      "epoch": 0.68,
      "eval_MSE/layer0": 628.092910030562,
      "eval_accuracy": 0.5357603583933366,
      "eval_dead_code_fraction/layer0": 0.0,
      "eval_input_norm/layer0": 31.997742160687373,
      "eval_loss": 1.9396723508834839,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 14.354976222496019,
      "eval_runtime": 73.9338,
      "eval_samples_per_second": 62.529,
      "eval_steps_per_second": 7.818,
      "step": 6500
    },
    {
      "MSE": 628.4872816975908,
      "MSE/layer0": 628.4872816975908,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.68,
      "input_norm": 31.997741378148394,
      "input_norm/layer0": 31.997741378148394,
      "learning_rate": 0.00018157894736842107,
      "loss": 1.9392,
      "max_norm": 74.95079040527344,
      "max_norm/layer0": 74.95079040527344,
      "mean_norm": 64.19818496704102,
      "mean_norm/layer0": 64.19818496704102,
      "multicode_k": 1,
      "output_norm": 14.340212704340617,
      "output_norm/layer0": 14.340212704340617,
      "step": 6550
    },
    {
      "MSE": 627.595106302897,
      "MSE/layer0": 627.595106302897,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.69,
      "input_norm": 31.99773236592611,
      "input_norm/layer0": 31.99773236592611,
      "learning_rate": 0.00017894736842105264,
      "loss": 1.9312,
      "max_norm": 75.08959197998047,
      "max_norm/layer0": 75.08959197998047,
      "mean_norm": 64.3110408782959,
      "mean_norm/layer0": 64.3110408782959,
      "multicode_k": 1,
      "output_norm": 14.375651826858522,
      "output_norm/layer0": 14.375651826858522,
      "step": 6600
    },
    {
      "MSE": 627.2688003540036,
      "MSE/layer0": 627.2688003540036,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.69,
      "input_norm": 31.997724459966015,
      "input_norm/layer0": 31.997724459966015,
      "learning_rate": 0.0001763157894736842,
      "loss": 1.9454,
      "max_norm": 75.23365783691406,
      "max_norm/layer0": 75.23365783691406,
      "mean_norm": 64.42234230041504,
      "mean_norm/layer0": 64.42234230041504,
      "multicode_k": 1,
      "output_norm": 14.385090745290121,
      "output_norm/layer0": 14.385090745290121,
      "step": 6650
    },
    {
      "MSE": 626.5893623860678,
      "MSE/layer0": 626.5893623860678,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.7,
      "input_norm": 31.997720209757503,
      "input_norm/layer0": 31.997720209757503,
      "learning_rate": 0.0001736842105263158,
      "loss": 1.9428,
      "max_norm": 75.36791229248047,
      "max_norm/layer0": 75.36791229248047,
      "mean_norm": 64.5310287475586,
      "mean_norm/layer0": 64.5310287475586,
      "multicode_k": 1,
      "output_norm": 14.414791498184208,
      "output_norm/layer0": 14.414791498184208,
      "step": 6700
    },
    {
      "MSE": 626.1687516276043,
      "MSE/layer0": 626.1687516276043,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.7,
      "input_norm": 31.997717237472536,
      "input_norm/layer0": 31.997717237472536,
      "learning_rate": 0.00017105263157894739,
      "loss": 1.9341,
      "max_norm": 75.49561309814453,
      "max_norm/layer0": 75.49561309814453,
      "mean_norm": 64.63836669921875,
      "mean_norm/layer0": 64.63836669921875,
      "multicode_k": 1,
      "output_norm": 14.436859647432962,
      "output_norm/layer0": 14.436859647432962,
      "step": 6750
    },
    {
      "MSE": 625.7842074584966,
      "MSE/layer0": 625.7842074584966,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.71,
      "input_norm": 31.997723042170207,
      "input_norm/layer0": 31.997723042170207,
      "learning_rate": 0.00016842105263157895,
      "loss": 1.9391,
      "max_norm": 75.62852478027344,
      "max_norm/layer0": 75.62852478027344,
      "mean_norm": 64.74386024475098,
      "mean_norm/layer0": 64.74386024475098,
      "multicode_k": 1,
      "output_norm": 14.45211536884308,
      "output_norm/layer0": 14.45211536884308,
      "step": 6800
    },
    {
      "MSE": 625.3583324178057,
      "MSE/layer0": 625.3583324178057,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.72,
      "input_norm": 31.997710723876956,
      "input_norm/layer0": 31.997710723876956,
      "learning_rate": 0.00016578947368421052,
      "loss": 1.9214,
      "max_norm": 75.7518081665039,
      "max_norm/layer0": 75.7518081665039,
      "mean_norm": 64.84785079956055,
      "mean_norm/layer0": 64.84785079956055,
      "multicode_k": 1,
      "output_norm": 14.472083713213603,
      "output_norm/layer0": 14.472083713213603,
      "step": 6850
    },
    {
      "MSE": 625.0808269246418,
      "MSE/layer0": 625.0808269246418,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.72,
      "input_norm": 31.997701005935667,
      "input_norm/layer0": 31.997701005935667,
      "learning_rate": 0.0001631578947368421,
      "loss": 1.9248,
      "max_norm": 75.8736343383789,
      "max_norm/layer0": 75.8736343383789,
      "mean_norm": 64.94989013671875,
      "mean_norm/layer0": 64.94989013671875,
      "multicode_k": 1,
      "output_norm": 14.49320138454437,
      "output_norm/layer0": 14.49320138454437,
      "step": 6900
    },
    {
      "MSE": 624.4893544514975,
      "MSE/layer0": 624.4893544514975,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.73,
      "input_norm": 31.997702992757166,
      "input_norm/layer0": 31.997702992757166,
      "learning_rate": 0.0001605263157894737,
      "loss": 1.9357,
      "max_norm": 75.99244689941406,
      "max_norm/layer0": 75.99244689941406,
      "mean_norm": 65.05006790161133,
      "mean_norm/layer0": 65.05006790161133,
      "multicode_k": 1,
      "output_norm": 14.515017460187277,
      "output_norm/layer0": 14.515017460187277,
      "step": 6950
    },
    {
      "MSE": 623.983821309408,
      "MSE/layer0": 623.983821309408,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.73,
      "input_norm": 31.997692581812547,
      "input_norm/layer0": 31.997692581812547,
      "learning_rate": 0.00015789473684210527,
      "loss": 1.9256,
      "max_norm": 76.1169204711914,
      "max_norm/layer0": 76.1169204711914,
      "mean_norm": 65.14841270446777,
      "mean_norm/layer0": 65.14841270446777,
      "multicode_k": 1,
      "output_norm": 14.531605450312297,
      "output_norm/layer0": 14.531605450312297,
      "step": 7000
    },
    {
      "epoch": 0.73,
      "eval_MSE/layer0": 623.2726008245854,
      "eval_accuracy": 0.5373965313049694,
      "eval_dead_code_fraction/layer0": 0.0,
      "eval_input_norm/layer0": 31.99768957905041,
      "eval_loss": 1.9302037954330444,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 14.553397603295936,
      "eval_runtime": 73.3018,
      "eval_samples_per_second": 63.068,
      "eval_steps_per_second": 7.885,
      "step": 7000
    },
    {
      "MSE": 623.8173256429034,
      "MSE/layer0": 623.8173256429034,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.74,
      "input_norm": 31.997689800262457,
      "input_norm/layer0": 31.997689800262457,
      "learning_rate": 0.00015526315789473686,
      "loss": 1.9215,
      "max_norm": 76.22943115234375,
      "max_norm/layer0": 76.22943115234375,
      "mean_norm": 65.2452278137207,
      "mean_norm/layer0": 65.2452278137207,
      "multicode_k": 1,
      "output_norm": 14.544135572115584,
      "output_norm/layer0": 14.544135572115584,
      "step": 7050
    },
    {
      "MSE": 623.4564833577472,
      "MSE/layer0": 623.4564833577472,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.74,
      "input_norm": 31.997697146733607,
      "input_norm/layer0": 31.997697146733607,
      "learning_rate": 0.00015263157894736842,
      "loss": 1.9291,
      "max_norm": 76.35796356201172,
      "max_norm/layer0": 76.35796356201172,
      "mean_norm": 65.33997344970703,
      "mean_norm/layer0": 65.33997344970703,
      "multicode_k": 1,
      "output_norm": 14.557166822751359,
      "output_norm/layer0": 14.557166822751359,
      "step": 7100
    },
    {
      "MSE": 622.3157424926754,
      "MSE/layer0": 622.3157424926754,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.75,
      "input_norm": 31.997690575917574,
      "input_norm/layer0": 31.997690575917574,
      "learning_rate": 0.00015,
      "loss": 1.9272,
      "max_norm": 76.47930145263672,
      "max_norm/layer0": 76.47930145263672,
      "mean_norm": 65.4333724975586,
      "mean_norm/layer0": 65.4333724975586,
      "multicode_k": 1,
      "output_norm": 14.59491890271505,
      "output_norm/layer0": 14.59491890271505,
      "step": 7150
    },
    {
      "MSE": 622.1008169555663,
      "MSE/layer0": 622.1008169555663,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.75,
      "input_norm": 31.997691469192503,
      "input_norm/layer0": 31.997691469192503,
      "learning_rate": 0.00014736842105263158,
      "loss": 1.9421,
      "max_norm": 76.5845947265625,
      "max_norm/layer0": 76.5845947265625,
      "mean_norm": 65.52462577819824,
      "mean_norm/layer0": 65.52462577819824,
      "multicode_k": 1,
      "output_norm": 14.608456416130064,
      "output_norm/layer0": 14.608456416130064,
      "step": 7200
    },
    {
      "MSE": 621.7943653361006,
      "MSE/layer0": 621.7943653361006,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.76,
      "input_norm": 31.997678140004478,
      "input_norm/layer0": 31.997678140004478,
      "learning_rate": 0.00014473684210526317,
      "loss": 1.9221,
      "max_norm": 76.68899536132812,
      "max_norm/layer0": 76.68899536132812,
      "mean_norm": 65.61434745788574,
      "mean_norm/layer0": 65.61434745788574,
      "multicode_k": 1,
      "output_norm": 14.622403078079222,
      "output_norm/layer0": 14.622403078079222,
      "step": 7250
    },
    {
      "MSE": 621.7445918782552,
      "MSE/layer0": 621.7445918782552,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.76,
      "input_norm": 31.997679424285884,
      "input_norm/layer0": 31.997679424285884,
      "learning_rate": 0.00014210526315789474,
      "loss": 1.9172,
      "max_norm": 76.79942321777344,
      "max_norm/layer0": 76.79942321777344,
      "mean_norm": 65.70241737365723,
      "mean_norm/layer0": 65.70241737365723,
      "multicode_k": 1,
      "output_norm": 14.632240413029983,
      "output_norm/layer0": 14.632240413029983,
      "step": 7300
    },
    {
      "MSE": 621.0073055013017,
      "MSE/layer0": 621.0073055013017,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.77,
      "input_norm": 31.997667986551914,
      "input_norm/layer0": 31.997667986551914,
      "learning_rate": 0.0001394736842105263,
      "loss": 1.9187,
      "max_norm": 76.90473937988281,
      "max_norm/layer0": 76.90473937988281,
      "mean_norm": 65.78865623474121,
      "mean_norm/layer0": 65.78865623474121,
      "multicode_k": 1,
      "output_norm": 14.659644064903254,
      "output_norm/layer0": 14.659644064903254,
      "step": 7350
    },
    {
      "MSE": 620.5166587320964,
      "MSE/layer0": 620.5166587320964,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.77,
      "input_norm": 31.99766827583312,
      "input_norm/layer0": 31.99766827583312,
      "learning_rate": 0.00013684210526315792,
      "loss": 1.9236,
      "max_norm": 77.00653839111328,
      "max_norm/layer0": 77.00653839111328,
      "mean_norm": 65.87344741821289,
      "mean_norm/layer0": 65.87344741821289,
      "multicode_k": 1,
      "output_norm": 14.683248674074807,
      "output_norm/layer0": 14.683248674074807,
      "step": 7400
    },
    {
      "MSE": 620.4730934651691,
      "MSE/layer0": 620.4730934651691,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.78,
      "input_norm": 31.99766536712645,
      "input_norm/layer0": 31.99766536712645,
      "learning_rate": 0.00013421052631578948,
      "loss": 1.9181,
      "max_norm": 77.11151123046875,
      "max_norm/layer0": 77.11151123046875,
      "mean_norm": 65.95642852783203,
      "mean_norm/layer0": 65.95642852783203,
      "multicode_k": 1,
      "output_norm": 14.682427426973977,
      "output_norm/layer0": 14.682427426973977,
      "step": 7450
    },
    {
      "MSE": 619.8806704711913,
      "MSE/layer0": 619.8806704711913,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.78,
      "input_norm": 31.997652931213374,
      "input_norm/layer0": 31.997652931213374,
      "learning_rate": 0.00013157894736842105,
      "loss": 1.9204,
      "max_norm": 77.21614837646484,
      "max_norm/layer0": 77.21614837646484,
      "mean_norm": 66.03750610351562,
      "mean_norm/layer0": 66.03750610351562,
      "multicode_k": 1,
      "output_norm": 14.709125100771587,
      "output_norm/layer0": 14.709125100771587,
      "step": 7500
    },
    {
      "epoch": 0.78,
      "eval_MSE/layer0": 619.4572802491444,
      "eval_accuracy": 0.538146743438657,
      "eval_dead_code_fraction/layer0": 0.0,
      "eval_input_norm/layer0": 31.997657016941467,
      "eval_loss": 1.9224542379379272,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 14.72584700899003,
      "eval_runtime": 73.2809,
      "eval_samples_per_second": 63.086,
      "eval_steps_per_second": 7.887,
      "step": 7500
    },
    {
      "MSE": 619.6498880004883,
      "MSE/layer0": 619.6498880004883,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.79,
      "input_norm": 31.997653865814208,
      "input_norm/layer0": 31.997653865814208,
      "learning_rate": 0.00012894736842105264,
      "loss": 1.9109,
      "max_norm": 77.3195571899414,
      "max_norm/layer0": 77.3195571899414,
      "mean_norm": 66.11709403991699,
      "mean_norm/layer0": 66.11709403991699,
      "multicode_k": 1,
      "output_norm": 14.724224853515622,
      "output_norm/layer0": 14.724224853515622,
      "step": 7550
    },
    {
      "MSE": 619.544646809896,
      "MSE/layer0": 619.544646809896,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.79,
      "input_norm": 31.997655792236333,
      "input_norm/layer0": 31.997655792236333,
      "learning_rate": 0.0001263157894736842,
      "loss": 1.9247,
      "max_norm": 77.41654205322266,
      "max_norm/layer0": 77.41654205322266,
      "mean_norm": 66.19502639770508,
      "mean_norm/layer0": 66.19502639770508,
      "multicode_k": 1,
      "output_norm": 14.729852019945778,
      "output_norm/layer0": 14.729852019945778,
      "step": 7600
    },
    {
      "MSE": 619.1442233276366,
      "MSE/layer0": 619.1442233276366,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.8,
      "input_norm": 31.99764471054077,
      "input_norm/layer0": 31.99764471054077,
      "learning_rate": 0.0001236842105263158,
      "loss": 1.9237,
      "max_norm": 77.5074234008789,
      "max_norm/layer0": 77.5074234008789,
      "mean_norm": 66.27114677429199,
      "mean_norm/layer0": 66.27114677429199,
      "multicode_k": 1,
      "output_norm": 14.745990212758379,
      "output_norm/layer0": 14.745990212758379,
      "step": 7650
    },
    {
      "MSE": 618.6404962158206,
      "MSE/layer0": 618.6404962158206,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.8,
      "input_norm": 31.997635892232267,
      "input_norm/layer0": 31.997635892232267,
      "learning_rate": 0.00012105263157894738,
      "loss": 1.913,
      "max_norm": 77.602294921875,
      "max_norm/layer0": 77.602294921875,
      "mean_norm": 66.34577751159668,
      "mean_norm/layer0": 66.34577751159668,
      "multicode_k": 1,
      "output_norm": 14.766639779408772,
      "output_norm/layer0": 14.766639779408772,
      "step": 7700
    },
    {
      "MSE": 618.2833578491213,
      "MSE/layer0": 618.2833578491213,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.81,
      "input_norm": 31.997631740570075,
      "input_norm/layer0": 31.997631740570075,
      "learning_rate": 0.00011842105263157894,
      "loss": 1.9214,
      "max_norm": 77.6917724609375,
      "max_norm/layer0": 77.6917724609375,
      "mean_norm": 66.41888046264648,
      "mean_norm/layer0": 66.41888046264648,
      "multicode_k": 1,
      "output_norm": 14.779039435386654,
      "output_norm/layer0": 14.779039435386654,
      "step": 7750
    },
    {
      "MSE": 618.2477112833653,
      "MSE/layer0": 618.2477112833653,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.81,
      "input_norm": 31.997634382247924,
      "input_norm/layer0": 31.997634382247924,
      "learning_rate": 0.00011578947368421053,
      "loss": 1.9127,
      "max_norm": 77.77839660644531,
      "max_norm/layer0": 77.77839660644531,
      "mean_norm": 66.49017333984375,
      "mean_norm/layer0": 66.49017333984375,
      "multicode_k": 1,
      "output_norm": 14.782011265754704,
      "output_norm/layer0": 14.782011265754704,
      "step": 7800
    },
    {
      "MSE": 617.7417582194005,
      "MSE/layer0": 617.7417582194005,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.82,
      "input_norm": 31.997628266016648,
      "input_norm/layer0": 31.997628266016648,
      "learning_rate": 0.00011315789473684211,
      "loss": 1.9084,
      "max_norm": 77.86212158203125,
      "max_norm/layer0": 77.86212158203125,
      "mean_norm": 66.55990791320801,
      "mean_norm/layer0": 66.55990791320801,
      "multicode_k": 1,
      "output_norm": 14.801776518821718,
      "output_norm/layer0": 14.801776518821718,
      "step": 7850
    },
    {
      "MSE": 617.339886271159,
      "MSE/layer0": 617.339886271159,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.82,
      "input_norm": 31.99762384732564,
      "input_norm/layer0": 31.99762384732564,
      "learning_rate": 0.00011052631578947368,
      "loss": 1.9115,
      "max_norm": 77.94374084472656,
      "max_norm/layer0": 77.94374084472656,
      "mean_norm": 66.62779235839844,
      "mean_norm/layer0": 66.62779235839844,
      "multicode_k": 1,
      "output_norm": 14.823196705182394,
      "output_norm/layer0": 14.823196705182394,
      "step": 7900
    },
    {
      "MSE": 617.3184334309897,
      "MSE/layer0": 617.3184334309897,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.83,
      "input_norm": 31.9976179567973,
      "input_norm/layer0": 31.9976179567973,
      "learning_rate": 0.00010789473684210527,
      "loss": 1.9136,
      "max_norm": 78.02580261230469,
      "max_norm/layer0": 78.02580261230469,
      "mean_norm": 66.69412803649902,
      "mean_norm/layer0": 66.69412803649902,
      "multicode_k": 1,
      "output_norm": 14.828250519434608,
      "output_norm/layer0": 14.828250519434608,
      "step": 7950
    },
    {
      "MSE": 616.9322255452475,
      "MSE/layer0": 616.9322255452475,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.84,
      "input_norm": 31.997613105773937,
      "input_norm/layer0": 31.997613105773937,
      "learning_rate": 0.00010526315789473683,
      "loss": 1.907,
      "max_norm": 78.10686492919922,
      "max_norm/layer0": 78.10686492919922,
      "mean_norm": 66.7584114074707,
      "mean_norm/layer0": 66.7584114074707,
      "multicode_k": 1,
      "output_norm": 14.839720834096273,
      "output_norm/layer0": 14.839720834096273,
      "step": 8000
    },
    {
      "epoch": 0.84,
      "eval_MSE/layer0": 616.4379357749087,
      "eval_accuracy": 0.5393073732024142,
      "eval_dead_code_fraction/layer0": 0.0,
      "eval_input_norm/layer0": 31.99761064584294,
      "eval_loss": 1.9150168895721436,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 14.862492301828695,
      "eval_runtime": 73.6278,
      "eval_samples_per_second": 62.789,
      "eval_steps_per_second": 7.85,
      "step": 8000
    },
    {
      "MSE": 616.6813212076825,
      "MSE/layer0": 616.6813212076825,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.84,
      "input_norm": 31.997603750228897,
      "input_norm/layer0": 31.997603750228897,
      "learning_rate": 0.00010263157894736843,
      "loss": 1.8975,
      "max_norm": 78.18397521972656,
      "max_norm/layer0": 78.18397521972656,
      "mean_norm": 66.82158279418945,
      "mean_norm/layer0": 66.82158279418945,
      "multicode_k": 1,
      "output_norm": 14.848202861150106,
      "output_norm/layer0": 14.848202861150106,
      "step": 8050
    },
    {
      "MSE": 616.5551970418294,
      "MSE/layer0": 616.5551970418294,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.85,
      "input_norm": 31.99760689099629,
      "input_norm/layer0": 31.99760689099629,
      "learning_rate": 0.0001,
      "loss": 1.916,
      "max_norm": 78.26499938964844,
      "max_norm/layer0": 78.26499938964844,
      "mean_norm": 66.88335037231445,
      "mean_norm/layer0": 66.88335037231445,
      "multicode_k": 1,
      "output_norm": 14.8604402812322,
      "output_norm/layer0": 14.8604402812322,
      "step": 8100
    },
    {
      "MSE": 616.288039347331,
      "MSE/layer0": 616.288039347331,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.85,
      "input_norm": 31.997600466410333,
      "input_norm/layer0": 31.997600466410333,
      "learning_rate": 9.736842105263158e-05,
      "loss": 1.902,
      "max_norm": 78.33844757080078,
      "max_norm/layer0": 78.33844757080078,
      "mean_norm": 66.94340133666992,
      "mean_norm/layer0": 66.94340133666992,
      "multicode_k": 1,
      "output_norm": 14.872187639872232,
      "output_norm/layer0": 14.872187639872232,
      "step": 8150
    },
    {
      "MSE": 615.8982196044924,
      "MSE/layer0": 615.8982196044924,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.86,
      "input_norm": 31.997594718933108,
      "input_norm/layer0": 31.997594718933108,
      "learning_rate": 9.473684210526316e-05,
      "loss": 1.9142,
      "max_norm": 78.40998077392578,
      "max_norm/layer0": 78.40998077392578,
      "mean_norm": 67.00171661376953,
      "mean_norm/layer0": 67.00171661376953,
      "multicode_k": 1,
      "output_norm": 14.884622203509018,
      "output_norm/layer0": 14.884622203509018,
      "step": 8200
    },
    {
      "MSE": 615.649053141276,
      "MSE/layer0": 615.649053141276,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.86,
      "input_norm": 31.997591203053794,
      "input_norm/layer0": 31.997591203053794,
      "learning_rate": 9.210526315789474e-05,
      "loss": 1.9103,
      "max_norm": 78.47700500488281,
      "max_norm/layer0": 78.47700500488281,
      "mean_norm": 67.05831527709961,
      "mean_norm/layer0": 67.05831527709961,
      "multicode_k": 1,
      "output_norm": 14.896942078272502,
      "output_norm/layer0": 14.896942078272502,
      "step": 8250
    },
    {
      "MSE": 615.4050069173176,
      "MSE/layer0": 615.4050069173176,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.87,
      "input_norm": 31.99757507324218,
      "input_norm/layer0": 31.99757507324218,
      "learning_rate": 8.947368421052632e-05,
      "loss": 1.8999,
      "max_norm": 78.54086303710938,
      "max_norm/layer0": 78.54086303710938,
      "mean_norm": 67.11351013183594,
      "mean_norm/layer0": 67.11351013183594,
      "multicode_k": 1,
      "output_norm": 14.907591681480406,
      "output_norm/layer0": 14.907591681480406,
      "step": 8300
    },
    {
      "MSE": 615.0221789550782,
      "MSE/layer0": 615.0221789550782,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.87,
      "input_norm": 31.997587076822917,
      "input_norm/layer0": 31.997587076822917,
      "learning_rate": 8.68421052631579e-05,
      "loss": 1.9122,
      "max_norm": 78.60425567626953,
      "max_norm/layer0": 78.60425567626953,
      "mean_norm": 67.1669692993164,
      "mean_norm/layer0": 67.1669692993164,
      "multicode_k": 1,
      "output_norm": 14.918850135803218,
      "output_norm/layer0": 14.918850135803218,
      "step": 8350
    },
    {
      "MSE": 614.7660255940759,
      "MSE/layer0": 614.7660255940759,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.88,
      "input_norm": 31.99758012771608,
      "input_norm/layer0": 31.99758012771608,
      "learning_rate": 8.421052631578948e-05,
      "loss": 1.9074,
      "max_norm": 78.66250610351562,
      "max_norm/layer0": 78.66250610351562,
      "mean_norm": 67.21884536743164,
      "mean_norm/layer0": 67.21884536743164,
      "multicode_k": 1,
      "output_norm": 14.930259111722311,
      "output_norm/layer0": 14.930259111722311,
      "step": 8400
    },
    {
      "MSE": 614.4904387410484,
      "MSE/layer0": 614.4904387410484,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.88,
      "input_norm": 31.99757884025574,
      "input_norm/layer0": 31.99757884025574,
      "learning_rate": 8.157894736842105e-05,
      "loss": 1.9151,
      "max_norm": 78.7247314453125,
      "max_norm/layer0": 78.7247314453125,
      "mean_norm": 67.26914596557617,
      "mean_norm/layer0": 67.26914596557617,
      "multicode_k": 1,
      "output_norm": 14.941800510088594,
      "output_norm/layer0": 14.941800510088594,
      "step": 8450
    },
    {
      "MSE": 614.3984759521479,
      "MSE/layer0": 614.3984759521479,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.89,
      "input_norm": 31.997565978368122,
      "input_norm/layer0": 31.997565978368122,
      "learning_rate": 7.894736842105263e-05,
      "loss": 1.8931,
      "max_norm": 78.78428649902344,
      "max_norm/layer0": 78.78428649902344,
      "mean_norm": 67.31785583496094,
      "mean_norm/layer0": 67.31785583496094,
      "multicode_k": 1,
      "output_norm": 14.948297271728517,
      "output_norm/layer0": 14.948297271728517,
      "step": 8500
    },
    {
      "epoch": 0.89,
      "eval_MSE/layer0": 613.78736410403,
      "eval_accuracy": 0.5408171011151899,
      "eval_dead_code_fraction/layer0": 0.0,
      "eval_input_norm/layer0": 31.997572115378908,
      "eval_loss": 1.9076036214828491,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 14.968526063531659,
      "eval_runtime": 73.9448,
      "eval_samples_per_second": 62.52,
      "eval_steps_per_second": 7.817,
      "step": 8500
    },
    {
      "MSE": 614.2003710937502,
      "MSE/layer0": 614.2003710937502,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.89,
      "input_norm": 31.997571328481037,
      "input_norm/layer0": 31.997571328481037,
      "learning_rate": 7.631578947368421e-05,
      "loss": 1.9006,
      "max_norm": 78.83836364746094,
      "max_norm/layer0": 78.83836364746094,
      "mean_norm": 67.36493301391602,
      "mean_norm/layer0": 67.36493301391602,
      "multicode_k": 1,
      "output_norm": 14.955024781227117,
      "output_norm/layer0": 14.955024781227117,
      "step": 8550
    },
    {
      "MSE": 613.8168900553383,
      "MSE/layer0": 613.8168900553383,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.9,
      "input_norm": 31.997557487487796,
      "input_norm/layer0": 31.997557487487796,
      "learning_rate": 7.368421052631579e-05,
      "loss": 1.9045,
      "max_norm": 78.8912582397461,
      "max_norm/layer0": 78.8912582397461,
      "mean_norm": 67.41046524047852,
      "mean_norm/layer0": 67.41046524047852,
      "multicode_k": 1,
      "output_norm": 14.968488362630207,
      "output_norm/layer0": 14.968488362630207,
      "step": 8600
    },
    {
      "MSE": 613.6968625895179,
      "MSE/layer0": 613.6968625895179,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.9,
      "input_norm": 31.99754828453064,
      "input_norm/layer0": 31.99754828453064,
      "learning_rate": 7.105263157894737e-05,
      "loss": 1.9009,
      "max_norm": 78.942626953125,
      "max_norm/layer0": 78.942626953125,
      "mean_norm": 67.45438766479492,
      "mean_norm/layer0": 67.45438766479492,
      "multicode_k": 1,
      "output_norm": 14.979475774765014,
      "output_norm/layer0": 14.979475774765014,
      "step": 8650
    },
    {
      "MSE": 613.3956824747725,
      "MSE/layer0": 613.3956824747725,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.91,
      "input_norm": 31.997546965281174,
      "input_norm/layer0": 31.997546965281174,
      "learning_rate": 6.842105263157896e-05,
      "loss": 1.9,
      "max_norm": 78.99479675292969,
      "max_norm/layer0": 78.99479675292969,
      "mean_norm": 67.49666595458984,
      "mean_norm/layer0": 67.49666595458984,
      "multicode_k": 1,
      "output_norm": 14.988234910964966,
      "output_norm/layer0": 14.988234910964966,
      "step": 8700
    },
    {
      "MSE": 613.2128627522789,
      "MSE/layer0": 613.2128627522789,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.91,
      "input_norm": 31.997544927597048,
      "input_norm/layer0": 31.997544927597048,
      "learning_rate": 6.578947368421052e-05,
      "loss": 1.9059,
      "max_norm": 79.04541015625,
      "max_norm/layer0": 79.04541015625,
      "mean_norm": 67.53742218017578,
      "mean_norm/layer0": 67.53742218017578,
      "multicode_k": 1,
      "output_norm": 14.991036421457924,
      "output_norm/layer0": 14.991036421457924,
      "step": 8750
    },
    {
      "MSE": 612.9370720418297,
      "MSE/layer0": 612.9370720418297,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.92,
      "input_norm": 31.99753908475239,
      "input_norm/layer0": 31.99753908475239,
      "learning_rate": 6.31578947368421e-05,
      "loss": 1.9023,
      "max_norm": 79.09040069580078,
      "max_norm/layer0": 79.09040069580078,
      "mean_norm": 67.57658767700195,
      "mean_norm/layer0": 67.57658767700195,
      "multicode_k": 1,
      "output_norm": 15.003661061922706,
      "output_norm/layer0": 15.003661061922706,
      "step": 8800
    },
    {
      "MSE": 613.0978963216148,
      "MSE/layer0": 613.0978963216148,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.92,
      "input_norm": 31.997535756429023,
      "input_norm/layer0": 31.997535756429023,
      "learning_rate": 6.052631578947369e-05,
      "loss": 1.9004,
      "max_norm": 79.13478088378906,
      "max_norm/layer0": 79.13478088378906,
      "mean_norm": 67.61412811279297,
      "mean_norm/layer0": 67.61412811279297,
      "multicode_k": 1,
      "output_norm": 14.999437109629307,
      "output_norm/layer0": 14.999437109629307,
      "step": 8850
    },
    {
      "MSE": 612.746408691406,
      "MSE/layer0": 612.746408691406,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.93,
      "input_norm": 31.997531512578334,
      "input_norm/layer0": 31.997531512578334,
      "learning_rate": 5.789473684210527e-05,
      "loss": 1.8947,
      "max_norm": 79.17863464355469,
      "max_norm/layer0": 79.17863464355469,
      "mean_norm": 67.65010452270508,
      "mean_norm/layer0": 67.65010452270508,
      "multicode_k": 1,
      "output_norm": 15.013854147593182,
      "output_norm/layer0": 15.013854147593182,
      "step": 8900
    },
    {
      "MSE": 612.5075473022462,
      "MSE/layer0": 612.5075473022462,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.93,
      "input_norm": 31.997522573471066,
      "input_norm/layer0": 31.997522573471066,
      "learning_rate": 5.526315789473684e-05,
      "loss": 1.888,
      "max_norm": 79.2198257446289,
      "max_norm/layer0": 79.2198257446289,
      "mean_norm": 67.6845588684082,
      "mean_norm/layer0": 67.6845588684082,
      "multicode_k": 1,
      "output_norm": 15.024005990028382,
      "output_norm/layer0": 15.024005990028382,
      "step": 8950
    },
    {
      "MSE": 612.4464337158204,
      "MSE/layer0": 612.4464337158204,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.94,
      "input_norm": 31.99751985549927,
      "input_norm/layer0": 31.99751985549927,
      "learning_rate": 5.263157894736842e-05,
      "loss": 1.9021,
      "max_norm": 79.25985717773438,
      "max_norm/layer0": 79.25985717773438,
      "mean_norm": 67.71733856201172,
      "mean_norm/layer0": 67.71733856201172,
      "multicode_k": 1,
      "output_norm": 15.025202210744226,
      "output_norm/layer0": 15.025202210744226,
      "step": 9000
    },
    {
      "epoch": 0.94,
      "eval_MSE/layer0": 612.012579843437,
      "eval_accuracy": 0.5416772654217966,
      "eval_dead_code_fraction/layer0": 0.0,
      "eval_input_norm/layer0": 31.99751990196794,
      "eval_loss": 1.90205979347229,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 15.037853428586699,
      "eval_runtime": 73.2981,
      "eval_samples_per_second": 63.071,
      "eval_steps_per_second": 7.886,
      "step": 9000
    },
    {
      "MSE": 612.1616466267901,
      "MSE/layer0": 612.1616466267901,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.94,
      "input_norm": 31.997515144348153,
      "input_norm/layer0": 31.997515144348153,
      "learning_rate": 5e-05,
      "loss": 1.8979,
      "max_norm": 79.2950668334961,
      "max_norm/layer0": 79.2950668334961,
      "mean_norm": 67.74863052368164,
      "mean_norm/layer0": 67.74863052368164,
      "multicode_k": 1,
      "output_norm": 15.036479252179465,
      "output_norm/layer0": 15.036479252179465,
      "step": 9050
    },
    {
      "MSE": 611.8442991129552,
      "MSE/layer0": 611.8442991129552,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.95,
      "input_norm": 31.99751302719116,
      "input_norm/layer0": 31.99751302719116,
      "learning_rate": 4.736842105263158e-05,
      "loss": 1.8978,
      "max_norm": 79.32892608642578,
      "max_norm/layer0": 79.32892608642578,
      "mean_norm": 67.77827835083008,
      "mean_norm/layer0": 67.77827835083008,
      "multicode_k": 1,
      "output_norm": 15.046743833223978,
      "output_norm/layer0": 15.046743833223978,
      "step": 9100
    },
    {
      "MSE": 611.9183032226562,
      "MSE/layer0": 611.9183032226562,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.96,
      "input_norm": 31.99751057942708,
      "input_norm/layer0": 31.99751057942708,
      "learning_rate": 4.473684210526316e-05,
      "loss": 1.8971,
      "max_norm": 79.36182403564453,
      "max_norm/layer0": 79.36182403564453,
      "mean_norm": 67.80632781982422,
      "mean_norm/layer0": 67.80632781982422,
      "multicode_k": 1,
      "output_norm": 15.041637244224557,
      "output_norm/layer0": 15.041637244224557,
      "step": 9150
    },
    {
      "MSE": 611.5441438802083,
      "MSE/layer0": 611.5441438802083,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.96,
      "input_norm": 31.99750095685323,
      "input_norm/layer0": 31.99750095685323,
      "learning_rate": 4.210526315789474e-05,
      "loss": 1.8874,
      "max_norm": 79.39281463623047,
      "max_norm/layer0": 79.39281463623047,
      "mean_norm": 67.83284759521484,
      "mean_norm/layer0": 67.83284759521484,
      "multicode_k": 1,
      "output_norm": 15.055660729408274,
      "output_norm/layer0": 15.055660729408274,
      "step": 9200
    },
    {
      "MSE": 611.5922235107425,
      "MSE/layer0": 611.5922235107425,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.97,
      "input_norm": 31.99750220934551,
      "input_norm/layer0": 31.99750220934551,
      "learning_rate": 3.9473684210526316e-05,
      "loss": 1.8958,
      "max_norm": 79.42273712158203,
      "max_norm/layer0": 79.42273712158203,
      "mean_norm": 67.85774230957031,
      "mean_norm/layer0": 67.85774230957031,
      "multicode_k": 1,
      "output_norm": 15.055747102101643,
      "output_norm/layer0": 15.055747102101643,
      "step": 9250
    },
    {
      "MSE": 611.6544079589839,
      "MSE/layer0": 611.6544079589839,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.97,
      "input_norm": 31.997499033610026,
      "input_norm/layer0": 31.997499033610026,
      "learning_rate": 3.6842105263157895e-05,
      "loss": 1.8915,
      "max_norm": 79.44976806640625,
      "max_norm/layer0": 79.44976806640625,
      "mean_norm": 67.88099670410156,
      "mean_norm/layer0": 67.88099670410156,
      "multicode_k": 1,
      "output_norm": 15.057963668505355,
      "output_norm/layer0": 15.057963668505355,
      "step": 9300
    },
    {
      "MSE": 611.321997172038,
      "MSE/layer0": 611.321997172038,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.98,
      "input_norm": 31.997498153050746,
      "input_norm/layer0": 31.997498153050746,
      "learning_rate": 3.421052631578948e-05,
      "loss": 1.8893,
      "max_norm": 79.47447967529297,
      "max_norm/layer0": 79.47447967529297,
      "mean_norm": 67.90266799926758,
      "mean_norm/layer0": 67.90266799926758,
      "multicode_k": 1,
      "output_norm": 15.067080327669775,
      "output_norm/layer0": 15.067080327669775,
      "step": 9350
    },
    {
      "MSE": 611.4500786336266,
      "MSE/layer0": 611.4500786336266,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.98,
      "input_norm": 31.997495447794595,
      "input_norm/layer0": 31.997495447794595,
      "learning_rate": 3.157894736842105e-05,
      "loss": 1.894,
      "max_norm": 79.49812316894531,
      "max_norm/layer0": 79.49812316894531,
      "mean_norm": 67.92279815673828,
      "mean_norm/layer0": 67.92279815673828,
      "multicode_k": 1,
      "output_norm": 15.062444001833596,
      "output_norm/layer0": 15.062444001833596,
      "step": 9400
    },
    {
      "MSE": 611.1107730102539,
      "MSE/layer0": 611.1107730102539,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.99,
      "input_norm": 31.997485151290896,
      "input_norm/layer0": 31.997485151290896,
      "learning_rate": 2.8947368421052634e-05,
      "loss": 1.8849,
      "max_norm": 79.52143096923828,
      "max_norm/layer0": 79.52143096923828,
      "mean_norm": 67.94132995605469,
      "mean_norm/layer0": 67.94132995605469,
      "multicode_k": 1,
      "output_norm": 15.076274760564168,
      "output_norm/layer0": 15.076274760564168,
      "step": 9450
    },
    {
      "MSE": 611.3009430948896,
      "MSE/layer0": 611.3009430948896,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.99,
      "input_norm": 31.99749323209126,
      "input_norm/layer0": 31.99749323209126,
      "learning_rate": 2.631578947368421e-05,
      "loss": 1.8967,
      "max_norm": 79.54227447509766,
      "max_norm/layer0": 79.54227447509766,
      "mean_norm": 67.958251953125,
      "mean_norm/layer0": 67.958251953125,
      "multicode_k": 1,
      "output_norm": 15.06888332684835,
      "output_norm/layer0": 15.06888332684835,
      "step": 9500
    },
    {
      "epoch": 0.99,
      "eval_MSE/layer0": 610.6120883183328,
      "eval_accuracy": 0.5425511737500183,
      "eval_dead_code_fraction/layer0": 0.0,
      "eval_input_norm/layer0": 31.99749166347134,
      "eval_loss": 1.8969556093215942,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 15.09320597480496,
      "eval_runtime": 73.3984,
      "eval_samples_per_second": 62.985,
      "eval_steps_per_second": 7.875,
      "step": 9500
    },
    {
      "MSE": 610.9202908325196,
      "MSE/layer0": 610.9202908325196,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 1.0,
      "input_norm": 31.99748815218606,
      "input_norm/layer0": 31.99748815218606,
      "learning_rate": 2.368421052631579e-05,
      "loss": 1.8917,
      "max_norm": 79.56092834472656,
      "max_norm/layer0": 79.56092834472656,
      "mean_norm": 67.97361755371094,
      "mean_norm/layer0": 67.97361755371094,
      "multicode_k": 1,
      "output_norm": 15.084220841725665,
      "output_norm/layer0": 15.084220841725665,
      "step": 9550
    },
    {
      "MSE": 610.9847631835939,
      "MSE/layer0": 610.9847631835939,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 1.0,
      "input_norm": 31.997486731211332,
      "input_norm/layer0": 31.997486731211332,
      "learning_rate": 2.105263157894737e-05,
      "loss": 1.8839,
      "max_norm": 79.57735443115234,
      "max_norm/layer0": 79.57735443115234,
      "mean_norm": 67.98743438720703,
      "mean_norm/layer0": 67.98743438720703,
      "multicode_k": 1,
      "output_norm": 15.082832886377968,
      "output_norm/layer0": 15.082832886377968,
      "step": 9600
    },
    {
      "MSE": 611.2879392496747,
      "MSE/layer0": 611.2879392496747,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 1.01,
      "input_norm": 31.997482639948544,
      "input_norm/layer0": 31.997482639948544,
      "learning_rate": 1.8421052631578947e-05,
      "loss": 1.8851,
      "max_norm": 79.59221649169922,
      "max_norm/layer0": 79.59221649169922,
      "mean_norm": 67.99962997436523,
      "mean_norm/layer0": 67.99962997436523,
      "multicode_k": 1,
      "output_norm": 15.075549699465444,
      "output_norm/layer0": 15.075549699465444,
      "step": 9650
    },
    {
      "MSE": 611.3861442057291,
      "MSE/layer0": 611.3861442057291,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 1.01,
      "input_norm": 31.997482592264817,
      "input_norm/layer0": 31.997482592264817,
      "learning_rate": 1.5789473684210526e-05,
      "loss": 1.8774,
      "max_norm": 79.60480499267578,
      "max_norm/layer0": 79.60480499267578,
      "mean_norm": 68.01019668579102,
      "mean_norm/layer0": 68.01019668579102,
      "multicode_k": 1,
      "output_norm": 15.07396024545034,
      "output_norm/layer0": 15.07396024545034,
      "step": 9700
    },
    {
      "MSE": 611.4255168660482,
      "MSE/layer0": 611.4255168660482,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 1.02,
      "input_norm": 31.997479289372762,
      "input_norm/layer0": 31.997479289372762,
      "learning_rate": 1.3157894736842104e-05,
      "loss": 1.8768,
      "max_norm": 79.6154556274414,
      "max_norm/layer0": 79.6154556274414,
      "mean_norm": 68.01911926269531,
      "mean_norm/layer0": 68.01911926269531,
      "multicode_k": 1,
      "output_norm": 15.07339178085327,
      "output_norm/layer0": 15.07339178085327,
      "step": 9750
    },
    {
      "MSE": 611.6131436157225,
      "MSE/layer0": 611.6131436157225,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 1.02,
      "input_norm": 31.99748600323995,
      "input_norm/layer0": 31.99748600323995,
      "learning_rate": 1.0526315789473684e-05,
      "loss": 1.8905,
      "max_norm": 79.62410736083984,
      "max_norm/layer0": 79.62410736083984,
      "mean_norm": 68.02641677856445,
      "mean_norm/layer0": 68.02641677856445,
      "multicode_k": 1,
      "output_norm": 15.068124500910447,
      "output_norm/layer0": 15.068124500910447,
      "step": 9800
    },
    {
      "MSE": 611.5507637532555,
      "MSE/layer0": 611.5507637532555,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 1.03,
      "input_norm": 31.997482582728068,
      "input_norm/layer0": 31.997482582728068,
      "learning_rate": 7.894736842105263e-06,
      "loss": 1.8798,
      "max_norm": 79.63082122802734,
      "max_norm/layer0": 79.63082122802734,
      "mean_norm": 68.03211212158203,
      "mean_norm/layer0": 68.03211212158203,
      "multicode_k": 1,
      "output_norm": 15.072520554860436,
      "output_norm/layer0": 15.072520554860436,
      "step": 9850
    },
    {
      "MSE": 611.7908610026044,
      "MSE/layer0": 611.7908610026044,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 1.03,
      "input_norm": 31.99747860272725,
      "input_norm/layer0": 31.99747860272725,
      "learning_rate": 5.263157894736842e-06,
      "loss": 1.8807,
      "max_norm": 79.63563537597656,
      "max_norm/layer0": 79.63563537597656,
      "mean_norm": 68.03619003295898,
      "mean_norm/layer0": 68.03619003295898,
      "multicode_k": 1,
      "output_norm": 15.06489105542501,
      "output_norm/layer0": 15.06489105542501,
      "step": 9900
    },
    {
      "MSE": 611.5220219930011,
      "MSE/layer0": 611.5220219930011,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 1.04,
      "input_norm": 31.997478488286326,
      "input_norm/layer0": 31.997478488286326,
      "learning_rate": 2.631578947368421e-06,
      "loss": 1.8795,
      "max_norm": 79.63849639892578,
      "max_norm/layer0": 79.63849639892578,
      "mean_norm": 68.03863906860352,
      "mean_norm/layer0": 68.03863906860352,
      "multicode_k": 1,
      "output_norm": 15.07397619565328,
      "output_norm/layer0": 15.07397619565328,
      "step": 9950
    },
    {
      "MSE": 611.5742947387696,
      "MSE/layer0": 611.5742947387696,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 1.04,
      "input_norm": 31.997486855189003,
      "input_norm/layer0": 31.997486855189003,
      "learning_rate": 0.0,
      "loss": 1.8942,
      "max_norm": 79.63946533203125,
      "max_norm/layer0": 79.63946533203125,
      "mean_norm": 68.03947448730469,
      "mean_norm/layer0": 68.03947448730469,
      "multicode_k": 1,
      "output_norm": 15.069696005185442,
      "output_norm/layer0": 15.069696005185442,
      "step": 10000
    },
    {
      "epoch": 1.04,
      "eval_MSE/layer0": 611.1571513346564,
      "eval_accuracy": 0.5429091526514649,
      "eval_dead_code_fraction/layer0": 0.0,
      "eval_input_norm/layer0": 31.997479090978388,
      "eval_loss": 1.89570152759552,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 15.087154228553715,
      "eval_runtime": 73.2125,
      "eval_samples_per_second": 63.145,
      "eval_steps_per_second": 7.895,
      "step": 10000
    },
    {
      "MSE": 0.0,
      "MSE/layer0": 0.0,
      "dead_code_fraction": 1.0,
      "dead_code_fraction/layer0": 1.0,
      "epoch": 1.04,
      "input_norm": 0.0,
      "input_norm/layer0": 0.0,
      "max_norm": 79.63946533203125,
      "max_norm/layer0": 79.63946533203125,
      "mean_norm": 68.03947448730469,
      "mean_norm/layer0": 68.03947448730469,
      "multicode_k": 1,
      "output_norm": 0.0,
      "output_norm/layer0": 0.0,
      "step": 10000,
      "total_flos": 3.715683581952e+16,
      "train_loss": 2.0762174885749816,
      "train_runtime": 12054.7701,
      "train_samples_per_second": 39.818,
      "train_steps_per_second": 0.83
    }
  ],
  "logging_steps": 50,
  "max_steps": 10000,
  "num_train_epochs": 2,
  "save_steps": 500,
  "total_flos": 3.715683581952e+16,
  "trial_name": null,
  "trial_params": null
}