{ "best_metric": null, "best_model_checkpoint": null, "epoch": 6.263048016701461, "global_step": 15000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.0, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 10.4479, "max_norm": 11.935791969299316, "max_norm/layer0": 11.528828620910645, "max_norm/layer1": 11.179052352905273, "max_norm/layer10": 11.443963050842285, "max_norm/layer11": 11.457213401794434, "max_norm/layer12": 11.09423828125, "max_norm/layer13": 10.991622924804688, "max_norm/layer14": 11.824307441711426, "max_norm/layer15": 11.151399612426758, "max_norm/layer16": 10.765336990356445, "max_norm/layer17": 11.6915922164917, "max_norm/layer18": 11.321767807006836, "max_norm/layer19": 11.388019561767578, "max_norm/layer2": 11.24202823638916, "max_norm/layer20": 11.28963851928711, "max_norm/layer21": 11.935791969299316, "max_norm/layer22": 11.426197052001953, "max_norm/layer23": 11.311007499694824, "max_norm/layer3": 11.2095308303833, "max_norm/layer4": 11.231363296508789, "max_norm/layer5": 11.49493408203125, "max_norm/layer6": 11.883358001708984, "max_norm/layer7": 11.410587310791016, "max_norm/layer8": 11.1673002243042, "max_norm/layer9": 11.320834159851074, "mean_norm": 7.9688674112161, "mean_norm/layer0": 7.968748152256012, "mean_norm/layer1": 7.968711107969284, "mean_norm/layer10": 7.96820729970932, "mean_norm/layer11": 7.968186259269714, "mean_norm/layer12": 7.971881151199341, "mean_norm/layer13": 7.9677393436431885, "mean_norm/layer14": 7.970236927270889, "mean_norm/layer15": 7.966938257217407, "mean_norm/layer16": 7.970880895853043, "mean_norm/layer17": 7.967200756072998, "mean_norm/layer18": 7.965942770242691, "mean_norm/layer19": 7.964955180883408, "mean_norm/layer2": 7.967412292957306, "mean_norm/layer20": 7.969712853431702, "mean_norm/layer21": 7.970251560211182, "mean_norm/layer22": 7.968287110328674, "mean_norm/layer23": 7.970414459705353, "mean_norm/layer3": 7.969215750694275, "mean_norm/layer4": 7.969323754310608, "mean_norm/layer5": 7.97068253159523, "mean_norm/layer6": 7.97090882062912, "mean_norm/layer7": 7.968297064304352, "mean_norm/layer8": 7.970566779375076, "mean_norm/layer9": 7.968116790056229, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 1 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.02, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 7.6233, "max_norm": 11.93603801727295, "max_norm/layer0": 11.531795501708984, "max_norm/layer1": 11.179537773132324, "max_norm/layer10": 11.448348045349121, "max_norm/layer11": 11.457023620605469, "max_norm/layer12": 11.094408988952637, "max_norm/layer13": 10.990287780761719, "max_norm/layer14": 11.82107925415039, "max_norm/layer15": 11.15367603302002, "max_norm/layer16": 10.769166946411133, "max_norm/layer17": 11.686759948730469, "max_norm/layer18": 11.32666301727295, "max_norm/layer19": 11.391281127929688, "max_norm/layer2": 11.241073608398438, "max_norm/layer20": 11.291045188903809, "max_norm/layer21": 11.93603801727295, "max_norm/layer22": 11.42624282836914, "max_norm/layer23": 11.311007499694824, "max_norm/layer3": 11.2095308303833, "max_norm/layer4": 11.232872009277344, "max_norm/layer5": 11.487099647521973, "max_norm/layer6": 11.881125450134277, "max_norm/layer7": 11.410587310791016, "max_norm/layer8": 11.176557540893555, "max_norm/layer9": 11.321023941040039, "mean_norm": 7.971554110447566, "mean_norm/layer0": 7.994439959526062, "mean_norm/layer1": 7.975339025259018, "mean_norm/layer10": 7.969327986240387, "mean_norm/layer11": 7.969180196523666, "mean_norm/layer12": 7.972845375537872, "mean_norm/layer13": 7.968711882829666, "mean_norm/layer14": 7.971314698457718, "mean_norm/layer15": 7.9680851101875305, "mean_norm/layer16": 7.971889913082123, "mean_norm/layer17": 7.968462765216827, "mean_norm/layer18": 7.966999590396881, "mean_norm/layer19": 7.9660108387470245, "mean_norm/layer2": 7.969779163599014, "mean_norm/layer20": 7.9709367752075195, "mean_norm/layer21": 7.971419245004654, "mean_norm/layer22": 7.969498664140701, "mean_norm/layer23": 7.971314489841461, "mean_norm/layer3": 7.973078697919846, "mean_norm/layer4": 7.971539229154587, "mean_norm/layer5": 7.973774015903473, "mean_norm/layer6": 7.972526788711548, "mean_norm/layer7": 7.969632714986801, "mean_norm/layer8": 7.971796870231628, "mean_norm/layer9": 7.969394654035568, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 50 }, { "epoch": 0.02, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.1632291324434277, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 5.859389781951904, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8439, "eval_samples_per_second": 20.348, "eval_steps_per_second": 0.675, "step": 50 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.04, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 4.8681, "max_norm": 11.938570022583008, "max_norm/layer0": 11.561639785766602, "max_norm/layer1": 11.204116821289062, "max_norm/layer10": 11.462130546569824, "max_norm/layer11": 11.474141120910645, "max_norm/layer12": 11.094062805175781, "max_norm/layer13": 11.00002670288086, "max_norm/layer14": 11.826424598693848, "max_norm/layer15": 11.166800498962402, "max_norm/layer16": 10.781830787658691, "max_norm/layer17": 11.687150001525879, "max_norm/layer18": 11.340291023254395, "max_norm/layer19": 11.40336799621582, "max_norm/layer2": 11.241272926330566, "max_norm/layer20": 11.293827056884766, "max_norm/layer21": 11.938570022583008, "max_norm/layer22": 11.450465202331543, "max_norm/layer23": 11.329928398132324, "max_norm/layer3": 11.215670585632324, "max_norm/layer4": 11.24952507019043, "max_norm/layer5": 11.489554405212402, "max_norm/layer6": 11.858213424682617, "max_norm/layer7": 11.412649154663086, "max_norm/layer8": 11.180521011352539, "max_norm/layer9": 11.323616981506348, "mean_norm": 7.995976222058137, "mean_norm/layer0": 8.02781367301941, "mean_norm/layer1": 8.001955300569534, "mean_norm/layer10": 7.991945534944534, "mean_norm/layer11": 7.994345277547836, "mean_norm/layer12": 7.9973015785217285, "mean_norm/layer13": 7.990174353122711, "mean_norm/layer14": 7.994365036487579, "mean_norm/layer15": 7.9937964379787445, "mean_norm/layer16": 7.993947863578796, "mean_norm/layer17": 7.9963139295578, "mean_norm/layer18": 7.992857217788696, "mean_norm/layer19": 7.993478715419769, "mean_norm/layer2": 7.984907865524292, "mean_norm/layer20": 7.996965527534485, "mean_norm/layer21": 7.9976761639118195, "mean_norm/layer22": 7.997446715831757, "mean_norm/layer23": 7.995190799236298, "mean_norm/layer3": 8.00449624657631, "mean_norm/layer4": 7.99257630109787, "mean_norm/layer5": 8.008823156356812, "mean_norm/layer6": 7.9886175096035, "mean_norm/layer7": 7.985989451408386, "mean_norm/layer8": 7.991247743368149, "mean_norm/layer9": 7.991196930408478, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 100 }, { "epoch": 0.04, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.3217572593827446, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 3.9806430339813232, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8323, "eval_samples_per_second": 20.368, "eval_steps_per_second": 0.676, "step": 100 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.06, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.8442, "max_norm": 11.94873046875, "max_norm/layer0": 11.583314895629883, "max_norm/layer1": 11.257062911987305, "max_norm/layer10": 11.477036476135254, "max_norm/layer11": 11.486359596252441, "max_norm/layer12": 11.094036102294922, "max_norm/layer13": 11.006564140319824, "max_norm/layer14": 11.83369255065918, "max_norm/layer15": 11.174107551574707, "max_norm/layer16": 10.795401573181152, "max_norm/layer17": 11.689741134643555, "max_norm/layer18": 11.353045463562012, "max_norm/layer19": 11.423429489135742, "max_norm/layer2": 11.241215705871582, "max_norm/layer20": 11.297418594360352, "max_norm/layer21": 11.94873046875, "max_norm/layer22": 11.467409133911133, "max_norm/layer23": 11.351099014282227, "max_norm/layer3": 11.237198829650879, "max_norm/layer4": 11.2833833694458, "max_norm/layer5": 11.501317024230957, "max_norm/layer6": 11.842484474182129, "max_norm/layer7": 11.412476539611816, "max_norm/layer8": 11.197505950927734, "max_norm/layer9": 11.32548713684082, "mean_norm": 8.025902200490236, "mean_norm/layer0": 8.05369970202446, "mean_norm/layer1": 8.029805958271027, "mean_norm/layer10": 8.019342005252838, "mean_norm/layer11": 8.026309847831726, "mean_norm/layer12": 8.027727752923965, "mean_norm/layer13": 8.017128229141235, "mean_norm/layer14": 8.023246347904205, "mean_norm/layer15": 8.024851232767105, "mean_norm/layer16": 8.020187258720398, "mean_norm/layer17": 8.030142724514008, "mean_norm/layer18": 8.022860586643219, "mean_norm/layer19": 8.024217784404755, "mean_norm/layer2": 8.00149068236351, "mean_norm/layer20": 8.02658200263977, "mean_norm/layer21": 8.028845071792603, "mean_norm/layer22": 8.0383882522583, "mean_norm/layer23": 8.036098837852478, "mean_norm/layer3": 8.042394787073135, "mean_norm/layer4": 8.019146829843521, "mean_norm/layer5": 8.053219020366669, "mean_norm/layer6": 8.007382929325104, "mean_norm/layer7": 8.00985363125801, "mean_norm/layer8": 8.019103825092316, "mean_norm/layer9": 8.019627511501312, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 150 }, { "epoch": 0.06, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.35747922269137633, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 3.630153179168701, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8097, "eval_samples_per_second": 20.407, "eval_steps_per_second": 0.677, "step": 150 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.08, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.6253, "max_norm": 11.97680950164795, "max_norm/layer0": 11.58055591583252, "max_norm/layer1": 11.294157028198242, "max_norm/layer10": 11.497956275939941, "max_norm/layer11": 11.496185302734375, "max_norm/layer12": 11.096875190734863, "max_norm/layer13": 11.013715744018555, "max_norm/layer14": 11.834508895874023, "max_norm/layer15": 11.183530807495117, "max_norm/layer16": 10.824295043945312, "max_norm/layer17": 11.690849304199219, "max_norm/layer18": 11.363268852233887, "max_norm/layer19": 11.44228744506836, "max_norm/layer2": 11.241418838500977, "max_norm/layer20": 11.30195140838623, "max_norm/layer21": 11.97680950164795, "max_norm/layer22": 11.490119934082031, "max_norm/layer23": 11.360661506652832, "max_norm/layer3": 11.250357627868652, "max_norm/layer4": 11.294978141784668, "max_norm/layer5": 11.523475646972656, "max_norm/layer6": 11.833582878112793, "max_norm/layer7": 11.412418365478516, "max_norm/layer8": 11.238706588745117, "max_norm/layer9": 11.328913688659668, "mean_norm": 8.050771818806728, "mean_norm/layer0": 8.074532568454742, "mean_norm/layer1": 8.053631067276001, "mean_norm/layer10": 8.043468981981277, "mean_norm/layer11": 8.05247575044632, "mean_norm/layer12": 8.05384948849678, "mean_norm/layer13": 8.039159834384918, "mean_norm/layer14": 8.047386288642883, "mean_norm/layer15": 8.051487892866135, "mean_norm/layer16": 8.041515946388245, "mean_norm/layer17": 8.056637048721313, "mean_norm/layer18": 8.044140785932541, "mean_norm/layer19": 8.046563893556595, "mean_norm/layer2": 8.015393018722534, "mean_norm/layer20": 8.04814100265503, "mean_norm/layer21": 8.051321744918823, "mean_norm/layer22": 8.069881677627563, "mean_norm/layer23": 8.0706427693367, "mean_norm/layer3": 8.075534343719482, "mean_norm/layer4": 8.043230772018433, "mean_norm/layer5": 8.093363732099533, "mean_norm/layer6": 8.024461150169373, "mean_norm/layer7": 8.032397478818893, "mean_norm/layer8": 8.044481456279755, "mean_norm/layer9": 8.044824957847595, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 200 }, { "epoch": 0.08, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.37222310104119766, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 3.484011650085449, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 10.8014, "eval_samples_per_second": 22.312, "eval_steps_per_second": 0.741, "step": 200 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.1, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.5035, "max_norm": 12.000293731689453, "max_norm/layer0": 11.585112571716309, "max_norm/layer1": 11.333687782287598, "max_norm/layer10": 11.51988410949707, "max_norm/layer11": 11.502758979797363, "max_norm/layer12": 11.100769996643066, "max_norm/layer13": 11.01984977722168, "max_norm/layer14": 11.828566551208496, "max_norm/layer15": 11.194990158081055, "max_norm/layer16": 10.869253158569336, "max_norm/layer17": 11.693120002746582, "max_norm/layer18": 11.377907752990723, "max_norm/layer19": 11.457249641418457, "max_norm/layer2": 11.241273880004883, "max_norm/layer20": 11.306483268737793, "max_norm/layer21": 12.000293731689453, "max_norm/layer22": 11.509583473205566, "max_norm/layer23": 11.3687744140625, "max_norm/layer3": 11.266392707824707, "max_norm/layer4": 11.302397727966309, "max_norm/layer5": 11.550718307495117, "max_norm/layer6": 11.818743705749512, "max_norm/layer7": 11.412418365478516, "max_norm/layer8": 11.272293090820312, "max_norm/layer9": 11.33436107635498, "mean_norm": 8.074364328136047, "mean_norm/layer0": 8.09387719631195, "mean_norm/layer1": 8.07526409626007, "mean_norm/layer10": 8.067595720291138, "mean_norm/layer11": 8.078146398067474, "mean_norm/layer12": 8.079148262739182, "mean_norm/layer13": 8.059981882572174, "mean_norm/layer14": 8.070948004722595, "mean_norm/layer15": 8.077279716730118, "mean_norm/layer16": 8.061559438705444, "mean_norm/layer17": 8.080615043640137, "mean_norm/layer18": 8.063488155603409, "mean_norm/layer19": 8.066218882799149, "mean_norm/layer2": 8.028005808591843, "mean_norm/layer20": 8.067834615707397, "mean_norm/layer21": 8.071941196918488, "mean_norm/layer22": 8.098706185817719, "mean_norm/layer23": 8.10308825969696, "mean_norm/layer3": 8.106619775295258, "mean_norm/layer4": 8.066012859344482, "mean_norm/layer5": 8.132562160491943, "mean_norm/layer6": 8.041042983531952, "mean_norm/layer7": 8.054872512817383, "mean_norm/layer8": 8.07003739476204, "mean_norm/layer9": 8.069897323846817, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 250 }, { "epoch": 0.1, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.38236737607638427, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 3.3861122131347656, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.55, "eval_samples_per_second": 20.866, "eval_steps_per_second": 0.693, "step": 250 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.13, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.4446, "max_norm": 12.001006126403809, "max_norm/layer0": 11.589604377746582, "max_norm/layer1": 11.3706693649292, "max_norm/layer10": 11.548222541809082, "max_norm/layer11": 11.507245063781738, "max_norm/layer12": 11.113755226135254, "max_norm/layer13": 11.024701118469238, "max_norm/layer14": 11.826601028442383, "max_norm/layer15": 11.213644027709961, "max_norm/layer16": 10.893625259399414, "max_norm/layer17": 11.694713592529297, "max_norm/layer18": 11.386850357055664, "max_norm/layer19": 11.475567817687988, "max_norm/layer2": 11.24197769165039, "max_norm/layer20": 11.314746856689453, "max_norm/layer21": 12.001006126403809, "max_norm/layer22": 11.535944938659668, "max_norm/layer23": 11.374551773071289, "max_norm/layer3": 11.290938377380371, "max_norm/layer4": 11.314577102661133, "max_norm/layer5": 11.561954498291016, "max_norm/layer6": 11.800447463989258, "max_norm/layer7": 11.412418365478516, "max_norm/layer8": 11.313380241394043, "max_norm/layer9": 11.339631080627441, "mean_norm": 8.098208792507648, "mean_norm/layer0": 8.112719625234604, "mean_norm/layer1": 8.09641945362091, "mean_norm/layer10": 8.09212476015091, "mean_norm/layer11": 8.104212701320648, "mean_norm/layer12": 8.105414420366287, "mean_norm/layer13": 8.080646514892578, "mean_norm/layer14": 8.094950437545776, "mean_norm/layer15": 8.103815019130707, "mean_norm/layer16": 8.082140505313873, "mean_norm/layer17": 8.104914009571075, "mean_norm/layer18": 8.082397997379303, "mean_norm/layer19": 8.085450172424316, "mean_norm/layer2": 8.041804730892181, "mean_norm/layer20": 8.088390350341797, "mean_norm/layer21": 8.09272289276123, "mean_norm/layer22": 8.127672553062439, "mean_norm/layer23": 8.135194897651672, "mean_norm/layer3": 8.137898802757263, "mean_norm/layer4": 8.089071333408356, "mean_norm/layer5": 8.171739280223846, "mean_norm/layer6": 8.057810544967651, "mean_norm/layer7": 8.078491449356079, "mean_norm/layer8": 8.095423579216003, "mean_norm/layer9": 8.095584988594055, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 300 }, { "epoch": 0.13, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.387530775564506, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 3.338789701461792, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8547, "eval_samples_per_second": 20.329, "eval_steps_per_second": 0.675, "step": 300 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.15, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.3923, "max_norm": 12.015610694885254, "max_norm/layer0": 11.587407112121582, "max_norm/layer1": 11.411787986755371, "max_norm/layer10": 11.574077606201172, "max_norm/layer11": 11.51120376586914, "max_norm/layer12": 11.12320613861084, "max_norm/layer13": 11.032407760620117, "max_norm/layer14": 11.822674751281738, "max_norm/layer15": 11.238204956054688, "max_norm/layer16": 10.920355796813965, "max_norm/layer17": 11.699063301086426, "max_norm/layer18": 11.408402442932129, "max_norm/layer19": 11.491950035095215, "max_norm/layer2": 11.242212295532227, "max_norm/layer20": 11.323861122131348, "max_norm/layer21": 12.015610694885254, "max_norm/layer22": 11.565690040588379, "max_norm/layer23": 11.3798828125, "max_norm/layer3": 11.31166934967041, "max_norm/layer4": 11.336499214172363, "max_norm/layer5": 11.575148582458496, "max_norm/layer6": 11.771903038024902, "max_norm/layer7": 11.412418365478516, "max_norm/layer8": 11.338603973388672, "max_norm/layer9": 11.345176696777344, "mean_norm": 8.122111474474272, "mean_norm/layer0": 8.130385041236877, "mean_norm/layer1": 8.116739928722382, "mean_norm/layer10": 8.117430806159973, "mean_norm/layer11": 8.13034301996231, "mean_norm/layer12": 8.132402211427689, "mean_norm/layer13": 8.10273027420044, "mean_norm/layer14": 8.119827210903168, "mean_norm/layer15": 8.131300270557404, "mean_norm/layer16": 8.103004693984985, "mean_norm/layer17": 8.129256963729858, "mean_norm/layer18": 8.101572036743164, "mean_norm/layer19": 8.104348003864288, "mean_norm/layer2": 8.053901731967926, "mean_norm/layer20": 8.108955979347229, "mean_norm/layer21": 8.113863289356232, "mean_norm/layer22": 8.156916499137878, "mean_norm/layer23": 8.166612327098846, "mean_norm/layer3": 8.168688178062439, "mean_norm/layer4": 8.11172890663147, "mean_norm/layer5": 8.211617052555084, "mean_norm/layer6": 8.074544966220856, "mean_norm/layer7": 8.101724714040756, "mean_norm/layer8": 8.12110459804535, "mean_norm/layer9": 8.121676683425903, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 350 }, { "epoch": 0.15, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.3928604746433685, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 3.292882204055786, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8031, "eval_samples_per_second": 20.418, "eval_steps_per_second": 0.678, "step": 350 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.17, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.3488, "max_norm": 12.052452087402344, "max_norm/layer0": 11.583168983459473, "max_norm/layer1": 11.448755264282227, "max_norm/layer10": 11.607074737548828, "max_norm/layer11": 11.51498794555664, "max_norm/layer12": 11.131906509399414, "max_norm/layer13": 11.042832374572754, "max_norm/layer14": 11.821359634399414, "max_norm/layer15": 11.259943962097168, "max_norm/layer16": 10.950507164001465, "max_norm/layer17": 11.704728126525879, "max_norm/layer18": 11.416481971740723, "max_norm/layer19": 11.509549140930176, "max_norm/layer2": 11.243173599243164, "max_norm/layer20": 11.331818580627441, "max_norm/layer21": 12.052452087402344, "max_norm/layer22": 11.601603507995605, "max_norm/layer23": 11.385972023010254, "max_norm/layer3": 11.330273628234863, "max_norm/layer4": 11.340890884399414, "max_norm/layer5": 11.589158058166504, "max_norm/layer6": 11.758391380310059, "max_norm/layer7": 11.412418365478516, "max_norm/layer8": 11.364471435546875, "max_norm/layer9": 11.363606452941895, "mean_norm": 8.146464373916388, "mean_norm/layer0": 8.147882997989655, "mean_norm/layer1": 8.137409269809723, "mean_norm/layer10": 8.143800973892212, "mean_norm/layer11": 8.15701961517334, "mean_norm/layer12": 8.159733355045319, "mean_norm/layer13": 8.12478882074356, "mean_norm/layer14": 8.144879519939423, "mean_norm/layer15": 8.15983933210373, "mean_norm/layer16": 8.124275922775269, "mean_norm/layer17": 8.154035031795502, "mean_norm/layer18": 8.12134873867035, "mean_norm/layer19": 8.123763740062714, "mean_norm/layer2": 8.06533831357956, "mean_norm/layer20": 8.130630254745483, "mean_norm/layer21": 8.135239839553833, "mean_norm/layer22": 8.187315464019775, "mean_norm/layer23": 8.198715567588806, "mean_norm/layer3": 8.200076937675476, "mean_norm/layer4": 8.13455080986023, "mean_norm/layer5": 8.252391397953033, "mean_norm/layer6": 8.09180998802185, "mean_norm/layer7": 8.12533888220787, "mean_norm/layer8": 8.147203147411346, "mean_norm/layer9": 8.147757053375244, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 400 }, { "epoch": 0.17, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.39780890148980097, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 3.262259006500244, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5766, "eval_samples_per_second": 20.818, "eval_steps_per_second": 0.691, "step": 400 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.19, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.3177, "max_norm": 12.075408935546875, "max_norm/layer0": 11.58000373840332, "max_norm/layer1": 11.467397689819336, "max_norm/layer10": 11.6430082321167, "max_norm/layer11": 11.519189834594727, "max_norm/layer12": 11.167428016662598, "max_norm/layer13": 11.051277160644531, "max_norm/layer14": 11.820220947265625, "max_norm/layer15": 11.288527488708496, "max_norm/layer16": 10.984353065490723, "max_norm/layer17": 11.70883846282959, "max_norm/layer18": 11.42200756072998, "max_norm/layer19": 11.528905868530273, "max_norm/layer2": 11.243820190429688, "max_norm/layer20": 11.341607093811035, "max_norm/layer21": 12.075408935546875, "max_norm/layer22": 11.638215065002441, "max_norm/layer23": 11.391865730285645, "max_norm/layer3": 11.364630699157715, "max_norm/layer4": 11.353809356689453, "max_norm/layer5": 11.606606483459473, "max_norm/layer6": 11.743355751037598, "max_norm/layer7": 11.412418365478516, "max_norm/layer8": 11.400062561035156, "max_norm/layer9": 11.37598991394043, "mean_norm": 8.171071887016296, "mean_norm/layer0": 8.165462255477905, "mean_norm/layer1": 8.157464504241943, "mean_norm/layer10": 8.170145452022552, "mean_norm/layer11": 8.183974206447601, "mean_norm/layer12": 8.187600195407867, "mean_norm/layer13": 8.146990656852722, "mean_norm/layer14": 8.170723497867584, "mean_norm/layer15": 8.188680768013, "mean_norm/layer16": 8.146208465099335, "mean_norm/layer17": 8.179404616355896, "mean_norm/layer18": 8.141136407852173, "mean_norm/layer19": 8.14376151561737, "mean_norm/layer2": 8.07688194513321, "mean_norm/layer20": 8.152221620082855, "mean_norm/layer21": 8.15705955028534, "mean_norm/layer22": 8.21717494726181, "mean_norm/layer23": 8.23116946220398, "mean_norm/layer3": 8.231843888759613, "mean_norm/layer4": 8.15757131576538, "mean_norm/layer5": 8.294019222259521, "mean_norm/layer6": 8.10983818769455, "mean_norm/layer7": 8.148617386817932, "mean_norm/layer8": 8.17370468378067, "mean_norm/layer9": 8.174070537090302, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 450 }, { "epoch": 0.19, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.3994718973972086, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 3.232194423675537, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8086, "eval_samples_per_second": 20.409, "eval_steps_per_second": 0.677, "step": 450 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.21, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.2894, "max_norm": 12.08602237701416, "max_norm/layer0": 11.57630443572998, "max_norm/layer1": 11.500665664672852, "max_norm/layer10": 11.685675621032715, "max_norm/layer11": 11.524746894836426, "max_norm/layer12": 11.200533866882324, "max_norm/layer13": 11.057424545288086, "max_norm/layer14": 11.818695068359375, "max_norm/layer15": 11.327396392822266, "max_norm/layer16": 11.003171920776367, "max_norm/layer17": 11.71567440032959, "max_norm/layer18": 11.435552597045898, "max_norm/layer19": 11.560956954956055, "max_norm/layer2": 11.249007225036621, "max_norm/layer20": 11.35300350189209, "max_norm/layer21": 12.08602237701416, "max_norm/layer22": 11.681539535522461, "max_norm/layer23": 11.402434349060059, "max_norm/layer3": 11.39268684387207, "max_norm/layer4": 11.360640525817871, "max_norm/layer5": 11.629146575927734, "max_norm/layer6": 11.73115348815918, "max_norm/layer7": 11.412418365478516, "max_norm/layer8": 11.449997901916504, "max_norm/layer9": 11.38539981842041, "mean_norm": 8.196226223061482, "mean_norm/layer0": 8.182831525802612, "mean_norm/layer1": 8.177292108535767, "mean_norm/layer10": 8.197421550750732, "mean_norm/layer11": 8.212226867675781, "mean_norm/layer12": 8.216940701007843, "mean_norm/layer13": 8.170343518257141, "mean_norm/layer14": 8.197417199611664, "mean_norm/layer15": 8.218412935733795, "mean_norm/layer16": 8.168900430202484, "mean_norm/layer17": 8.205419719219208, "mean_norm/layer18": 8.161637961864471, "mean_norm/layer19": 8.164183616638184, "mean_norm/layer2": 8.088469088077545, "mean_norm/layer20": 8.17502224445343, "mean_norm/layer21": 8.179168939590454, "mean_norm/layer22": 8.248070120811462, "mean_norm/layer23": 8.263128936290741, "mean_norm/layer3": 8.263891696929932, "mean_norm/layer4": 8.180212199687958, "mean_norm/layer5": 8.336524426937103, "mean_norm/layer6": 8.128240823745728, "mean_norm/layer7": 8.172141283750534, "mean_norm/layer8": 8.200634181499481, "mean_norm/layer9": 8.20089727640152, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 500 }, { "epoch": 0.21, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4021610834621141, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 3.2090389728546143, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5576, "eval_samples_per_second": 20.852, "eval_steps_per_second": 0.692, "step": 500 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.23, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.2724, "max_norm": 12.093631744384766, "max_norm/layer0": 11.574031829833984, "max_norm/layer1": 11.520513534545898, "max_norm/layer10": 11.72606372833252, "max_norm/layer11": 11.533076286315918, "max_norm/layer12": 11.226149559020996, "max_norm/layer13": 11.076735496520996, "max_norm/layer14": 11.817575454711914, "max_norm/layer15": 11.362285614013672, "max_norm/layer16": 11.021040916442871, "max_norm/layer17": 11.723470687866211, "max_norm/layer18": 11.440601348876953, "max_norm/layer19": 11.586626052856445, "max_norm/layer2": 11.307050704956055, "max_norm/layer20": 11.366878509521484, "max_norm/layer21": 12.093631744384766, "max_norm/layer22": 11.715110778808594, "max_norm/layer23": 11.419413566589355, "max_norm/layer3": 11.408477783203125, "max_norm/layer4": 11.373757362365723, "max_norm/layer5": 11.641069412231445, "max_norm/layer6": 11.724522590637207, "max_norm/layer7": 11.412418365478516, "max_norm/layer8": 11.494658470153809, "max_norm/layer9": 11.404236793518066, "mean_norm": 8.221715872486433, "mean_norm/layer0": 8.199663996696472, "mean_norm/layer1": 8.197345733642578, "mean_norm/layer10": 8.224578857421875, "mean_norm/layer11": 8.241481006145477, "mean_norm/layer12": 8.246900916099548, "mean_norm/layer13": 8.194350957870483, "mean_norm/layer14": 8.224222719669342, "mean_norm/layer15": 8.249268531799316, "mean_norm/layer16": 8.192130506038666, "mean_norm/layer17": 8.23191773891449, "mean_norm/layer18": 8.183155179023743, "mean_norm/layer19": 8.184997946023941, "mean_norm/layer2": 8.100345313549042, "mean_norm/layer20": 8.198180854320526, "mean_norm/layer21": 8.201505959033966, "mean_norm/layer22": 8.27897161245346, "mean_norm/layer23": 8.2966029047966, "mean_norm/layer3": 8.295648694038391, "mean_norm/layer4": 8.202883422374725, "mean_norm/layer5": 8.379289329051971, "mean_norm/layer6": 8.146961510181427, "mean_norm/layer7": 8.195779234170914, "mean_norm/layer8": 8.22712391614914, "mean_norm/layer9": 8.227874100208282, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 550 }, { "epoch": 0.23, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4047083064617531, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 3.19132661819458, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8083, "eval_samples_per_second": 20.409, "eval_steps_per_second": 0.677, "step": 550 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.25, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.2613, "max_norm": 12.08575439453125, "max_norm/layer0": 11.57294750213623, "max_norm/layer1": 11.550745010375977, "max_norm/layer10": 11.778457641601562, "max_norm/layer11": 11.543680191040039, "max_norm/layer12": 11.26294231414795, "max_norm/layer13": 11.098902702331543, "max_norm/layer14": 11.818066596984863, "max_norm/layer15": 11.396076202392578, "max_norm/layer16": 11.038070678710938, "max_norm/layer17": 11.729777336120605, "max_norm/layer18": 11.44991683959961, "max_norm/layer19": 11.609344482421875, "max_norm/layer2": 11.325920104980469, "max_norm/layer20": 11.378867149353027, "max_norm/layer21": 12.08575439453125, "max_norm/layer22": 11.764599800109863, "max_norm/layer23": 11.429723739624023, "max_norm/layer3": 11.43395709991455, "max_norm/layer4": 11.382811546325684, "max_norm/layer5": 11.653532028198242, "max_norm/layer6": 11.715897560119629, "max_norm/layer7": 11.412418365478516, "max_norm/layer8": 11.53526782989502, "max_norm/layer9": 11.41949462890625, "mean_norm": 8.2477020782729, "mean_norm/layer0": 8.216517150402069, "mean_norm/layer1": 8.217063426971436, "mean_norm/layer10": 8.252220571041107, "mean_norm/layer11": 8.27081310749054, "mean_norm/layer12": 8.277320384979248, "mean_norm/layer13": 8.218484103679657, "mean_norm/layer14": 8.251877188682556, "mean_norm/layer15": 8.280709624290466, "mean_norm/layer16": 8.215820074081421, "mean_norm/layer17": 8.259000062942505, "mean_norm/layer18": 8.205557763576508, "mean_norm/layer19": 8.20718702673912, "mean_norm/layer2": 8.11178743839264, "mean_norm/layer20": 8.222057938575745, "mean_norm/layer21": 8.225264191627502, "mean_norm/layer22": 8.31117445230484, "mean_norm/layer23": 8.33020955324173, "mean_norm/layer3": 8.328413903713226, "mean_norm/layer4": 8.22685432434082, "mean_norm/layer5": 8.42192029953003, "mean_norm/layer6": 8.165671527385712, "mean_norm/layer7": 8.219844996929169, "mean_norm/layer8": 8.254268229007721, "mean_norm/layer9": 8.25481253862381, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 600 }, { "epoch": 0.25, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.40806674697720074, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 3.164001226425171, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8121, "eval_samples_per_second": 20.403, "eval_steps_per_second": 0.677, "step": 600 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.27, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.2317, "max_norm": 12.080315589904785, "max_norm/layer0": 11.57314395904541, "max_norm/layer1": 11.564712524414062, "max_norm/layer10": 11.826842308044434, "max_norm/layer11": 11.56205940246582, "max_norm/layer12": 11.327191352844238, "max_norm/layer13": 11.14234447479248, "max_norm/layer14": 11.822623252868652, "max_norm/layer15": 11.452949523925781, "max_norm/layer16": 11.063272476196289, "max_norm/layer17": 11.735552787780762, "max_norm/layer18": 11.489537239074707, "max_norm/layer19": 11.642096519470215, "max_norm/layer2": 11.34683895111084, "max_norm/layer20": 11.390698432922363, "max_norm/layer21": 12.080315589904785, "max_norm/layer22": 11.80964469909668, "max_norm/layer23": 11.444567680358887, "max_norm/layer3": 11.46610164642334, "max_norm/layer4": 11.389155387878418, "max_norm/layer5": 11.663924217224121, "max_norm/layer6": 11.711557388305664, "max_norm/layer7": 11.412418365478516, "max_norm/layer8": 11.58823299407959, "max_norm/layer9": 11.441153526306152, "mean_norm": 8.27368176728487, "mean_norm/layer0": 8.23319536447525, "mean_norm/layer1": 8.236526012420654, "mean_norm/layer10": 8.279936909675598, "mean_norm/layer11": 8.300039291381836, "mean_norm/layer12": 8.308358132839203, "mean_norm/layer13": 8.24279397726059, "mean_norm/layer14": 8.280017256736755, "mean_norm/layer15": 8.31208449602127, "mean_norm/layer16": 8.239376664161682, "mean_norm/layer17": 8.286569893360138, "mean_norm/layer18": 8.228154420852661, "mean_norm/layer19": 8.229794263839722, "mean_norm/layer2": 8.122508347034454, "mean_norm/layer20": 8.247145473957062, "mean_norm/layer21": 8.249900996685028, "mean_norm/layer22": 8.343108773231506, "mean_norm/layer23": 8.363870322704315, "mean_norm/layer3": 8.359816431999207, "mean_norm/layer4": 8.249790847301483, "mean_norm/layer5": 8.46416860818863, "mean_norm/layer6": 8.183874189853668, "mean_norm/layer7": 8.243731617927551, "mean_norm/layer8": 8.281560719013214, "mean_norm/layer9": 8.282039403915405, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 650 }, { "epoch": 0.27, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.40971351853429216, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 3.150172233581543, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.798, "eval_samples_per_second": 20.427, "eval_steps_per_second": 0.678, "step": 650 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.29, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.2188, "max_norm": 12.064549446105957, "max_norm/layer0": 11.576369285583496, "max_norm/layer1": 11.57625961303711, "max_norm/layer10": 11.87590217590332, "max_norm/layer11": 11.576005935668945, "max_norm/layer12": 11.397974014282227, "max_norm/layer13": 11.20036506652832, "max_norm/layer14": 11.824828147888184, "max_norm/layer15": 11.515402793884277, "max_norm/layer16": 11.112325668334961, "max_norm/layer17": 11.739395141601562, "max_norm/layer18": 11.53075885772705, "max_norm/layer19": 11.668770790100098, "max_norm/layer2": 11.371235847473145, "max_norm/layer20": 11.404346466064453, "max_norm/layer21": 12.064549446105957, "max_norm/layer22": 11.857187271118164, "max_norm/layer23": 11.460153579711914, "max_norm/layer3": 11.484306335449219, "max_norm/layer4": 11.393518447875977, "max_norm/layer5": 11.679058074951172, "max_norm/layer6": 11.7113618850708, "max_norm/layer7": 11.412549018859863, "max_norm/layer8": 11.63630485534668, "max_norm/layer9": 11.468382835388184, "mean_norm": 8.29998386775454, "mean_norm/layer0": 8.249696731567383, "mean_norm/layer1": 8.255469501018524, "mean_norm/layer10": 8.307538092136383, "mean_norm/layer11": 8.328807175159454, "mean_norm/layer12": 8.340057134628296, "mean_norm/layer13": 8.267650306224823, "mean_norm/layer14": 8.308513700962067, "mean_norm/layer15": 8.343885838985443, "mean_norm/layer16": 8.263654291629791, "mean_norm/layer17": 8.315043985843658, "mean_norm/layer18": 8.251324594020844, "mean_norm/layer19": 8.253050774335861, "mean_norm/layer2": 8.132669448852539, "mean_norm/layer20": 8.273239970207214, "mean_norm/layer21": 8.275495648384094, "mean_norm/layer22": 8.376473069190979, "mean_norm/layer23": 8.397179186344147, "mean_norm/layer3": 8.391516983509064, "mean_norm/layer4": 8.27236133813858, "mean_norm/layer5": 8.507023572921753, "mean_norm/layer6": 8.20206767320633, "mean_norm/layer7": 8.268005192279816, "mean_norm/layer8": 8.309515058994293, "mean_norm/layer9": 8.309373557567596, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 700 }, { "epoch": 0.29, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.411676664922549, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 3.1364951133728027, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7803, "eval_samples_per_second": 20.458, "eval_steps_per_second": 0.679, "step": 700 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.31, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.2161, "max_norm": 12.05309772491455, "max_norm/layer0": 11.57707691192627, "max_norm/layer1": 11.590497970581055, "max_norm/layer10": 11.933767318725586, "max_norm/layer11": 11.590163230895996, "max_norm/layer12": 11.48369312286377, "max_norm/layer13": 11.255187034606934, "max_norm/layer14": 11.825422286987305, "max_norm/layer15": 11.571812629699707, "max_norm/layer16": 11.15307331085205, "max_norm/layer17": 11.7452392578125, "max_norm/layer18": 11.56918716430664, "max_norm/layer19": 11.707026481628418, "max_norm/layer2": 11.40218448638916, "max_norm/layer20": 11.431868553161621, "max_norm/layer21": 12.05309772491455, "max_norm/layer22": 11.90449333190918, "max_norm/layer23": 11.471346855163574, "max_norm/layer3": 11.509933471679688, "max_norm/layer4": 11.459664344787598, "max_norm/layer5": 11.687596321105957, "max_norm/layer6": 11.70588207244873, "max_norm/layer7": 11.449671745300293, "max_norm/layer8": 11.691574096679688, "max_norm/layer9": 11.537601470947266, "mean_norm": 8.326080996543169, "mean_norm/layer0": 8.265921652317047, "mean_norm/layer1": 8.27424931526184, "mean_norm/layer10": 8.334565043449402, "mean_norm/layer11": 8.358085632324219, "mean_norm/layer12": 8.371635675430298, "mean_norm/layer13": 8.292467653751373, "mean_norm/layer14": 8.336614668369293, "mean_norm/layer15": 8.375074326992035, "mean_norm/layer16": 8.288271248340607, "mean_norm/layer17": 8.343531310558319, "mean_norm/layer18": 8.274474322795868, "mean_norm/layer19": 8.276240915060043, "mean_norm/layer2": 8.142491519451141, "mean_norm/layer20": 8.299282789230347, "mean_norm/layer21": 8.301438212394714, "mean_norm/layer22": 8.409608781337738, "mean_norm/layer23": 8.431357860565186, "mean_norm/layer3": 8.42233693599701, "mean_norm/layer4": 8.29524427652359, "mean_norm/layer5": 8.54966390132904, "mean_norm/layer6": 8.2197967171669, "mean_norm/layer7": 8.291634261608124, "mean_norm/layer8": 8.336127936840057, "mean_norm/layer9": 8.335828959941864, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 750 }, { "epoch": 0.31, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.41466194538072465, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 3.1243374347686768, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7875, "eval_samples_per_second": 20.445, "eval_steps_per_second": 0.679, "step": 750 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.33, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.1922, "max_norm": 12.044909477233887, "max_norm/layer0": 11.577107429504395, "max_norm/layer1": 11.596969604492188, "max_norm/layer10": 11.989384651184082, "max_norm/layer11": 11.607263565063477, "max_norm/layer12": 11.563121795654297, "max_norm/layer13": 11.30004596710205, "max_norm/layer14": 11.83565616607666, "max_norm/layer15": 11.635966300964355, "max_norm/layer16": 11.215364456176758, "max_norm/layer17": 11.751420974731445, "max_norm/layer18": 11.606756210327148, "max_norm/layer19": 11.731042861938477, "max_norm/layer2": 11.428869247436523, "max_norm/layer20": 11.478826522827148, "max_norm/layer21": 12.044909477233887, "max_norm/layer22": 11.962320327758789, "max_norm/layer23": 11.527593612670898, "max_norm/layer3": 11.53365707397461, "max_norm/layer4": 11.52773666381836, "max_norm/layer5": 11.69833755493164, "max_norm/layer6": 11.700189590454102, "max_norm/layer7": 11.472933769226074, "max_norm/layer8": 11.752439498901367, "max_norm/layer9": 11.594074249267578, "mean_norm": 8.351811222732067, "mean_norm/layer0": 8.281863927841187, "mean_norm/layer1": 8.29244977235794, "mean_norm/layer10": 8.361223697662354, "mean_norm/layer11": 8.386799097061157, "mean_norm/layer12": 8.403019607067108, "mean_norm/layer13": 8.316332519054413, "mean_norm/layer14": 8.364771544933319, "mean_norm/layer15": 8.405999541282654, "mean_norm/layer16": 8.312246263027191, "mean_norm/layer17": 8.372030258178711, "mean_norm/layer18": 8.297933518886566, "mean_norm/layer19": 8.299460768699646, "mean_norm/layer2": 8.151886761188507, "mean_norm/layer20": 8.324509799480438, "mean_norm/layer21": 8.326754689216614, "mean_norm/layer22": 8.443054556846619, "mean_norm/layer23": 8.464609026908875, "mean_norm/layer3": 8.452716946601868, "mean_norm/layer4": 8.317551970481873, "mean_norm/layer5": 8.592187523841858, "mean_norm/layer6": 8.237367451190948, "mean_norm/layer7": 8.314523756504059, "mean_norm/layer8": 8.362704694271088, "mean_norm/layer9": 8.36147165298462, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 800 }, { "epoch": 0.33, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.41583821077864713, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 3.110368251800537, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7951, "eval_samples_per_second": 20.432, "eval_steps_per_second": 0.678, "step": 800 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.35, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.1722, "max_norm": 12.041813850402832, "max_norm/layer0": 11.581586837768555, "max_norm/layer1": 11.61563491821289, "max_norm/layer10": 12.041813850402832, "max_norm/layer11": 11.62158203125, "max_norm/layer12": 11.668936729431152, "max_norm/layer13": 11.349258422851562, "max_norm/layer14": 11.871787071228027, "max_norm/layer15": 11.716175079345703, "max_norm/layer16": 11.261540412902832, "max_norm/layer17": 11.757204055786133, "max_norm/layer18": 11.649191856384277, "max_norm/layer19": 11.76467514038086, "max_norm/layer2": 11.455350875854492, "max_norm/layer20": 11.54249382019043, "max_norm/layer21": 12.034183502197266, "max_norm/layer22": 12.032604217529297, "max_norm/layer23": 11.640424728393555, "max_norm/layer3": 11.551873207092285, "max_norm/layer4": 11.593846321105957, "max_norm/layer5": 11.747194290161133, "max_norm/layer6": 11.696702003479004, "max_norm/layer7": 11.496893882751465, "max_norm/layer8": 11.801105499267578, "max_norm/layer9": 11.650264739990234, "mean_norm": 8.377701930701733, "mean_norm/layer0": 8.297932505607605, "mean_norm/layer1": 8.310682237148285, "mean_norm/layer10": 8.388074398040771, "mean_norm/layer11": 8.416272222995758, "mean_norm/layer12": 8.433896124362946, "mean_norm/layer13": 8.340609431266785, "mean_norm/layer14": 8.393010914325714, "mean_norm/layer15": 8.437807321548462, "mean_norm/layer16": 8.33694452047348, "mean_norm/layer17": 8.400605857372284, "mean_norm/layer18": 8.321976900100708, "mean_norm/layer19": 8.323336660861969, "mean_norm/layer2": 8.161349713802338, "mean_norm/layer20": 8.351431608200073, "mean_norm/layer21": 8.352801442146301, "mean_norm/layer22": 8.476556599140167, "mean_norm/layer23": 8.498172104358673, "mean_norm/layer3": 8.483105719089508, "mean_norm/layer4": 8.33917647600174, "mean_norm/layer5": 8.63397741317749, "mean_norm/layer6": 8.25437742471695, "mean_norm/layer7": 8.337139964103699, "mean_norm/layer8": 8.388812839984894, "mean_norm/layer9": 8.386795938014984, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 850 }, { "epoch": 0.35, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.41578142555254055, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 3.0969085693359375, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8094, "eval_samples_per_second": 20.407, "eval_steps_per_second": 0.677, "step": 850 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.38, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.1726, "max_norm": 12.105155944824219, "max_norm/layer0": 11.583524703979492, "max_norm/layer1": 11.676701545715332, "max_norm/layer10": 12.105155944824219, "max_norm/layer11": 11.638466835021973, "max_norm/layer12": 11.77223014831543, "max_norm/layer13": 11.394583702087402, "max_norm/layer14": 11.909969329833984, "max_norm/layer15": 11.791295051574707, "max_norm/layer16": 11.316922187805176, "max_norm/layer17": 11.762696266174316, "max_norm/layer18": 11.696808815002441, "max_norm/layer19": 11.803051948547363, "max_norm/layer2": 11.476975440979004, "max_norm/layer20": 11.61272144317627, "max_norm/layer21": 12.020544052124023, "max_norm/layer22": 12.087778091430664, "max_norm/layer23": 11.726238250732422, "max_norm/layer3": 11.56999683380127, "max_norm/layer4": 11.669652938842773, "max_norm/layer5": 11.824197769165039, "max_norm/layer6": 11.70715045928955, "max_norm/layer7": 11.523516654968262, "max_norm/layer8": 11.856184005737305, "max_norm/layer9": 11.70484447479248, "mean_norm": 8.403302758932114, "mean_norm/layer0": 8.313547551631927, "mean_norm/layer1": 8.32844340801239, "mean_norm/layer10": 8.414072811603546, "mean_norm/layer11": 8.445135712623596, "mean_norm/layer12": 8.465462267398834, "mean_norm/layer13": 8.364917397499084, "mean_norm/layer14": 8.421625912189484, "mean_norm/layer15": 8.468998491764069, "mean_norm/layer16": 8.361238062381744, "mean_norm/layer17": 8.429136097431183, "mean_norm/layer18": 8.345595300197601, "mean_norm/layer19": 8.347301244735718, "mean_norm/layer2": 8.170057713985443, "mean_norm/layer20": 8.378221929073334, "mean_norm/layer21": 8.378659009933472, "mean_norm/layer22": 8.510486662387848, "mean_norm/layer23": 8.53170108795166, "mean_norm/layer3": 8.512450098991394, "mean_norm/layer4": 8.360101521015167, "mean_norm/layer5": 8.675426006317139, "mean_norm/layer6": 8.27113664150238, "mean_norm/layer7": 8.359546661376953, "mean_norm/layer8": 8.414047420024872, "mean_norm/layer9": 8.411957204341888, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 900 }, { "epoch": 0.38, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4186653038212401, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 3.0817902088165283, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5214, "eval_samples_per_second": 20.918, "eval_steps_per_second": 0.694, "step": 900 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.4, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.1672, "max_norm": 12.155872344970703, "max_norm/layer0": 11.587013244628906, "max_norm/layer1": 11.7393217086792, "max_norm/layer10": 12.155872344970703, "max_norm/layer11": 11.661779403686523, "max_norm/layer12": 11.862051963806152, "max_norm/layer13": 11.456026077270508, "max_norm/layer14": 11.942784309387207, "max_norm/layer15": 11.870194435119629, "max_norm/layer16": 11.392291069030762, "max_norm/layer17": 11.770665168762207, "max_norm/layer18": 11.740965843200684, "max_norm/layer19": 11.83622932434082, "max_norm/layer2": 11.501779556274414, "max_norm/layer20": 11.678656578063965, "max_norm/layer21": 12.005668640136719, "max_norm/layer22": 12.143045425415039, "max_norm/layer23": 11.798517227172852, "max_norm/layer3": 11.589555740356445, "max_norm/layer4": 11.730375289916992, "max_norm/layer5": 11.893560409545898, "max_norm/layer6": 11.800168991088867, "max_norm/layer7": 11.626232147216797, "max_norm/layer8": 11.903609275817871, "max_norm/layer9": 11.769264221191406, "mean_norm": 8.42872379720211, "mean_norm/layer0": 8.329014301300049, "mean_norm/layer1": 8.345844089984894, "mean_norm/layer10": 8.440021395683289, "mean_norm/layer11": 8.47356379032135, "mean_norm/layer12": 8.4962397813797, "mean_norm/layer13": 8.388897180557251, "mean_norm/layer14": 8.449989914894104, "mean_norm/layer15": 8.499238908290863, "mean_norm/layer16": 8.385041534900665, "mean_norm/layer17": 8.458029627799988, "mean_norm/layer18": 8.369693100452423, "mean_norm/layer19": 8.371399164199829, "mean_norm/layer2": 8.178799033164978, "mean_norm/layer20": 8.405226469039917, "mean_norm/layer21": 8.40516346693039, "mean_norm/layer22": 8.544622302055359, "mean_norm/layer23": 8.565294981002808, "mean_norm/layer3": 8.541715741157532, "mean_norm/layer4": 8.380447745323181, "mean_norm/layer5": 8.717021226882935, "mean_norm/layer6": 8.287675678730011, "mean_norm/layer7": 8.38047194480896, "mean_norm/layer8": 8.439296841621399, "mean_norm/layer9": 8.436662912368774, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 950 }, { "epoch": 0.4, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.41965904527810566, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 3.0697402954101562, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8068, "eval_samples_per_second": 20.412, "eval_steps_per_second": 0.678, "step": 950 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.42, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.1499, "max_norm": 12.205371856689453, "max_norm/layer0": 11.665349960327148, "max_norm/layer1": 11.794570922851562, "max_norm/layer10": 12.205371856689453, "max_norm/layer11": 11.683103561401367, "max_norm/layer12": 11.96533489227295, "max_norm/layer13": 11.50973892211914, "max_norm/layer14": 11.985956192016602, "max_norm/layer15": 11.945061683654785, "max_norm/layer16": 11.481783866882324, "max_norm/layer17": 11.784865379333496, "max_norm/layer18": 11.786661148071289, "max_norm/layer19": 11.881720542907715, "max_norm/layer2": 11.518780708312988, "max_norm/layer20": 11.752313613891602, "max_norm/layer21": 11.9920015335083, "max_norm/layer22": 12.204444885253906, "max_norm/layer23": 11.857336044311523, "max_norm/layer3": 11.719679832458496, "max_norm/layer4": 11.798518180847168, "max_norm/layer5": 11.96689224243164, "max_norm/layer6": 11.870284080505371, "max_norm/layer7": 11.738767623901367, "max_norm/layer8": 11.964406967163086, "max_norm/layer9": 11.882627487182617, "mean_norm": 8.453645870089531, "mean_norm/layer0": 8.3440882563591, "mean_norm/layer1": 8.363113164901733, "mean_norm/layer10": 8.465011715888977, "mean_norm/layer11": 8.501566469669342, "mean_norm/layer12": 8.526647329330444, "mean_norm/layer13": 8.4126957654953, "mean_norm/layer14": 8.477688908576965, "mean_norm/layer15": 8.52941745519638, "mean_norm/layer16": 8.408942818641663, "mean_norm/layer17": 8.486901998519897, "mean_norm/layer18": 8.393563508987427, "mean_norm/layer19": 8.395319759845734, "mean_norm/layer2": 8.187123000621796, "mean_norm/layer20": 8.431950569152832, "mean_norm/layer21": 8.430995404720306, "mean_norm/layer22": 8.57761299610138, "mean_norm/layer23": 8.598110377788544, "mean_norm/layer3": 8.570252418518066, "mean_norm/layer4": 8.400231778621674, "mean_norm/layer5": 8.75737339258194, "mean_norm/layer6": 8.30407863855362, "mean_norm/layer7": 8.400870144367218, "mean_norm/layer8": 8.463805377483368, "mean_norm/layer9": 8.460139632225037, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 1000 }, { "epoch": 0.42, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4205027114945466, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 3.066149950027466, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5243, "eval_samples_per_second": 20.912, "eval_steps_per_second": 0.694, "step": 1000 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.44, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.137, "max_norm": 12.26101303100586, "max_norm/layer0": 11.757697105407715, "max_norm/layer1": 11.850423812866211, "max_norm/layer10": 12.26101303100586, "max_norm/layer11": 11.710984230041504, "max_norm/layer12": 12.059286117553711, "max_norm/layer13": 11.577807426452637, "max_norm/layer14": 12.023432731628418, "max_norm/layer15": 12.022744178771973, "max_norm/layer16": 11.563203811645508, "max_norm/layer17": 11.832247734069824, "max_norm/layer18": 11.830646514892578, "max_norm/layer19": 11.917702674865723, "max_norm/layer2": 11.566544532775879, "max_norm/layer20": 11.846986770629883, "max_norm/layer21": 11.974418640136719, "max_norm/layer22": 12.259807586669922, "max_norm/layer23": 11.933194160461426, "max_norm/layer3": 11.790570259094238, "max_norm/layer4": 11.847346305847168, "max_norm/layer5": 12.058023452758789, "max_norm/layer6": 11.934420585632324, "max_norm/layer7": 11.859853744506836, "max_norm/layer8": 12.027948379516602, "max_norm/layer9": 12.007089614868164, "mean_norm": 8.478731632232666, "mean_norm/layer0": 8.359271585941315, "mean_norm/layer1": 8.380109190940857, "mean_norm/layer10": 8.489783465862274, "mean_norm/layer11": 8.528929233551025, "mean_norm/layer12": 8.557556688785553, "mean_norm/layer13": 8.436564564704895, "mean_norm/layer14": 8.50514006614685, "mean_norm/layer15": 8.559872150421143, "mean_norm/layer16": 8.43321669101715, "mean_norm/layer17": 8.515621662139893, "mean_norm/layer18": 8.417644321918488, "mean_norm/layer19": 8.419948518276215, "mean_norm/layer2": 8.196061968803406, "mean_norm/layer20": 8.459028244018555, "mean_norm/layer21": 8.457358598709106, "mean_norm/layer22": 8.611605882644653, "mean_norm/layer23": 8.631408274173737, "mean_norm/layer3": 8.599063694477081, "mean_norm/layer4": 8.419784009456635, "mean_norm/layer5": 8.797651767730713, "mean_norm/layer6": 8.320107817649841, "mean_norm/layer7": 8.4212247133255, "mean_norm/layer8": 8.488442122936249, "mean_norm/layer9": 8.48416393995285, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 1050 }, { "epoch": 0.44, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.42164247210425765, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 3.0529024600982666, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8004, "eval_samples_per_second": 20.423, "eval_steps_per_second": 0.678, "step": 1050 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.46, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.1325, "max_norm": 12.337430000305176, "max_norm/layer0": 11.839350700378418, "max_norm/layer1": 11.910687446594238, "max_norm/layer10": 12.316972732543945, "max_norm/layer11": 11.7444486618042, "max_norm/layer12": 12.147137641906738, "max_norm/layer13": 11.644682884216309, "max_norm/layer14": 12.059837341308594, "max_norm/layer15": 12.106205940246582, "max_norm/layer16": 11.641736030578613, "max_norm/layer17": 11.914681434631348, "max_norm/layer18": 11.873185157775879, "max_norm/layer19": 11.963512420654297, "max_norm/layer2": 11.602706909179688, "max_norm/layer20": 11.907248497009277, "max_norm/layer21": 11.956596374511719, "max_norm/layer22": 12.337430000305176, "max_norm/layer23": 12.008430480957031, "max_norm/layer3": 11.857219696044922, "max_norm/layer4": 11.907477378845215, "max_norm/layer5": 12.181724548339844, "max_norm/layer6": 12.007532119750977, "max_norm/layer7": 12.028894424438477, "max_norm/layer8": 12.075993537902832, "max_norm/layer9": 12.120156288146973, "mean_norm": 8.503541881839434, "mean_norm/layer0": 8.374323666095734, "mean_norm/layer1": 8.396947979927063, "mean_norm/layer10": 8.514197707176208, "mean_norm/layer11": 8.556173324584961, "mean_norm/layer12": 8.588340997695923, "mean_norm/layer13": 8.459864497184753, "mean_norm/layer14": 8.53289008140564, "mean_norm/layer15": 8.589832186698914, "mean_norm/layer16": 8.457439363002777, "mean_norm/layer17": 8.544645309448242, "mean_norm/layer18": 8.441946268081665, "mean_norm/layer19": 8.444604992866516, "mean_norm/layer2": 8.204352736473083, "mean_norm/layer20": 8.486289203166962, "mean_norm/layer21": 8.483921110630035, "mean_norm/layer22": 8.645121037960052, "mean_norm/layer23": 8.664347052574158, "mean_norm/layer3": 8.627211809158325, "mean_norm/layer4": 8.439228117465973, "mean_norm/layer5": 8.836770415306091, "mean_norm/layer6": 8.33525162935257, "mean_norm/layer7": 8.441284954547882, "mean_norm/layer8": 8.512612342834473, "mean_norm/layer9": 8.507408380508423, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 1100 }, { "epoch": 0.46, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.422713279225125, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 3.053382396697998, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8038, "eval_samples_per_second": 20.417, "eval_steps_per_second": 0.678, "step": 1100 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.48, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.1134, "max_norm": 12.390501022338867, "max_norm/layer0": 11.916831016540527, "max_norm/layer1": 11.991969108581543, "max_norm/layer10": 12.356989860534668, "max_norm/layer11": 11.778839111328125, "max_norm/layer12": 12.239680290222168, "max_norm/layer13": 11.736593246459961, "max_norm/layer14": 12.143863677978516, "max_norm/layer15": 12.180139541625977, "max_norm/layer16": 11.728737831115723, "max_norm/layer17": 12.01159381866455, "max_norm/layer18": 11.933110237121582, "max_norm/layer19": 12.001410484313965, "max_norm/layer2": 11.658327102661133, "max_norm/layer20": 11.978069305419922, "max_norm/layer21": 11.949234008789062, "max_norm/layer22": 12.390501022338867, "max_norm/layer23": 12.06468677520752, "max_norm/layer3": 11.926894187927246, "max_norm/layer4": 11.99174976348877, "max_norm/layer5": 12.265400886535645, "max_norm/layer6": 12.064791679382324, "max_norm/layer7": 12.149833679199219, "max_norm/layer8": 12.13364028930664, "max_norm/layer9": 12.21767807006836, "mean_norm": 8.52769010514021, "mean_norm/layer0": 8.388884007930756, "mean_norm/layer1": 8.41365897655487, "mean_norm/layer10": 8.53753811120987, "mean_norm/layer11": 8.58243614435196, "mean_norm/layer12": 8.618303418159485, "mean_norm/layer13": 8.482500731945038, "mean_norm/layer14": 8.5594362616539, "mean_norm/layer15": 8.619120597839355, "mean_norm/layer16": 8.481026113033295, "mean_norm/layer17": 8.573175191879272, "mean_norm/layer18": 8.466035664081573, "mean_norm/layer19": 8.468759298324585, "mean_norm/layer2": 8.21207869052887, "mean_norm/layer20": 8.513489484786987, "mean_norm/layer21": 8.50997406244278, "mean_norm/layer22": 8.67935174703598, "mean_norm/layer23": 8.69653707742691, "mean_norm/layer3": 8.654048144817352, "mean_norm/layer4": 8.45800656080246, "mean_norm/layer5": 8.874925374984741, "mean_norm/layer6": 8.349959671497345, "mean_norm/layer7": 8.460034430027008, "mean_norm/layer8": 8.535409569740295, "mean_norm/layer9": 8.529873192310333, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 1150 }, { "epoch": 0.48, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.42448984558474584, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 3.033704996109009, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5345, "eval_samples_per_second": 20.894, "eval_steps_per_second": 0.694, "step": 1150 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.5, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.0942, "max_norm": 12.468120574951172, "max_norm/layer0": 11.995326042175293, "max_norm/layer1": 12.067697525024414, "max_norm/layer10": 12.403990745544434, "max_norm/layer11": 11.817073822021484, "max_norm/layer12": 12.339508056640625, "max_norm/layer13": 11.813336372375488, "max_norm/layer14": 12.205154418945312, "max_norm/layer15": 12.247501373291016, "max_norm/layer16": 11.802889823913574, "max_norm/layer17": 12.11780834197998, "max_norm/layer18": 11.991769790649414, "max_norm/layer19": 12.04055404663086, "max_norm/layer2": 11.691339492797852, "max_norm/layer20": 12.061504364013672, "max_norm/layer21": 11.942378997802734, "max_norm/layer22": 12.468120574951172, "max_norm/layer23": 12.125564575195312, "max_norm/layer3": 12.011069297790527, "max_norm/layer4": 12.092073440551758, "max_norm/layer5": 12.332050323486328, "max_norm/layer6": 12.111506462097168, "max_norm/layer7": 12.237801551818848, "max_norm/layer8": 12.18825626373291, "max_norm/layer9": 12.341841697692871, "mean_norm": 8.55142513414224, "mean_norm/layer0": 8.403229653835297, "mean_norm/layer1": 8.430038452148438, "mean_norm/layer10": 8.560727715492249, "mean_norm/layer11": 8.608600378036499, "mean_norm/layer12": 8.647474765777588, "mean_norm/layer13": 8.504248023033142, "mean_norm/layer14": 8.58581668138504, "mean_norm/layer15": 8.647967278957367, "mean_norm/layer16": 8.503765046596527, "mean_norm/layer17": 8.601675927639008, "mean_norm/layer18": 8.490412592887878, "mean_norm/layer19": 8.492941200733185, "mean_norm/layer2": 8.219275295734406, "mean_norm/layer20": 8.539772391319275, "mean_norm/layer21": 8.53559297323227, "mean_norm/layer22": 8.712083876132965, "mean_norm/layer23": 8.729129493236542, "mean_norm/layer3": 8.680878758430481, "mean_norm/layer4": 8.476042687892914, "mean_norm/layer5": 8.91216629743576, "mean_norm/layer6": 8.364468932151794, "mean_norm/layer7": 8.478329598903656, "mean_norm/layer8": 8.557778775691986, "mean_norm/layer9": 8.551786422729492, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 1200 }, { "epoch": 0.5, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.425163156122867, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 3.0296287536621094, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7916, "eval_samples_per_second": 20.438, "eval_steps_per_second": 0.678, "step": 1200 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.52, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.1078, "max_norm": 12.530866622924805, "max_norm/layer0": 12.061227798461914, "max_norm/layer1": 12.141142845153809, "max_norm/layer10": 12.451057434082031, "max_norm/layer11": 11.885611534118652, "max_norm/layer12": 12.420894622802734, "max_norm/layer13": 11.879868507385254, "max_norm/layer14": 12.285859107971191, "max_norm/layer15": 12.319154739379883, "max_norm/layer16": 11.870779037475586, "max_norm/layer17": 12.209052085876465, "max_norm/layer18": 12.042786598205566, "max_norm/layer19": 12.080160140991211, "max_norm/layer2": 11.76501178741455, "max_norm/layer20": 12.142309188842773, "max_norm/layer21": 12.006357192993164, "max_norm/layer22": 12.530866622924805, "max_norm/layer23": 12.205020904541016, "max_norm/layer3": 12.123080253601074, "max_norm/layer4": 12.156495094299316, "max_norm/layer5": 12.430468559265137, "max_norm/layer6": 12.177638053894043, "max_norm/layer7": 12.356688499450684, "max_norm/layer8": 12.309911727905273, "max_norm/layer9": 12.442432403564453, "mean_norm": 8.574853877226511, "mean_norm/layer0": 8.417532444000244, "mean_norm/layer1": 8.446242809295654, "mean_norm/layer10": 8.583423614501953, "mean_norm/layer11": 8.634363651275635, "mean_norm/layer12": 8.676055133342743, "mean_norm/layer13": 8.525701999664307, "mean_norm/layer14": 8.611644744873047, "mean_norm/layer15": 8.676322281360626, "mean_norm/layer16": 8.526974976062775, "mean_norm/layer17": 8.629515528678894, "mean_norm/layer18": 8.514853537082672, "mean_norm/layer19": 8.516682028770447, "mean_norm/layer2": 8.226419508457184, "mean_norm/layer20": 8.565673828125, "mean_norm/layer21": 8.56021511554718, "mean_norm/layer22": 8.744957864284515, "mean_norm/layer23": 8.761150598526001, "mean_norm/layer3": 8.706950187683105, "mean_norm/layer4": 8.49384981393814, "mean_norm/layer5": 8.949612021446228, "mean_norm/layer6": 8.378373205661774, "mean_norm/layer7": 8.496361255645752, "mean_norm/layer8": 8.580375611782074, "mean_norm/layer9": 8.573241293430328, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 1250 }, { "epoch": 0.52, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4257472327342492, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 3.0218803882598877, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7879, "eval_samples_per_second": 20.445, "eval_steps_per_second": 0.679, "step": 1250 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.54, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.086, "max_norm": 12.616530418395996, "max_norm/layer0": 12.120105743408203, "max_norm/layer1": 12.24160385131836, "max_norm/layer10": 12.489425659179688, "max_norm/layer11": 11.951299667358398, "max_norm/layer12": 12.510804176330566, "max_norm/layer13": 11.954564094543457, "max_norm/layer14": 12.374727249145508, "max_norm/layer15": 12.41003131866455, "max_norm/layer16": 11.95055866241455, "max_norm/layer17": 12.313188552856445, "max_norm/layer18": 12.117609977722168, "max_norm/layer19": 12.119937896728516, "max_norm/layer2": 11.798491477966309, "max_norm/layer20": 12.230223655700684, "max_norm/layer21": 12.09094524383545, "max_norm/layer22": 12.616530418395996, "max_norm/layer23": 12.287936210632324, "max_norm/layer3": 12.218461990356445, "max_norm/layer4": 12.223498344421387, "max_norm/layer5": 12.541898727416992, "max_norm/layer6": 12.239702224731445, "max_norm/layer7": 12.441795349121094, "max_norm/layer8": 12.388147354125977, "max_norm/layer9": 12.528850555419922, "mean_norm": 8.597911283373833, "mean_norm/layer0": 8.4317027926445, "mean_norm/layer1": 8.461981654167175, "mean_norm/layer10": 8.605356931686401, "mean_norm/layer11": 8.659491837024689, "mean_norm/layer12": 8.704477965831757, "mean_norm/layer13": 8.547408878803253, "mean_norm/layer14": 8.637555420398712, "mean_norm/layer15": 8.704207181930542, "mean_norm/layer16": 8.54949301481247, "mean_norm/layer17": 8.657357454299927, "mean_norm/layer18": 8.539100170135498, "mean_norm/layer19": 8.540253460407257, "mean_norm/layer2": 8.23346322774887, "mean_norm/layer20": 8.592048525810242, "mean_norm/layer21": 8.585165977478027, "mean_norm/layer22": 8.777146875858307, "mean_norm/layer23": 8.792299032211304, "mean_norm/layer3": 8.732121765613556, "mean_norm/layer4": 8.511165499687195, "mean_norm/layer5": 8.986108601093292, "mean_norm/layer6": 8.391669809818268, "mean_norm/layer7": 8.513608872890472, "mean_norm/layer8": 8.602046430110931, "mean_norm/layer9": 8.594639420509338, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 1300 }, { "epoch": 0.54, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.42775093999829644, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 3.009110927581787, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8152, "eval_samples_per_second": 20.397, "eval_steps_per_second": 0.677, "step": 1300 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.56, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.0909, "max_norm": 12.686294555664062, "max_norm/layer0": 12.181984901428223, "max_norm/layer1": 12.317867279052734, "max_norm/layer10": 12.543929100036621, "max_norm/layer11": 12.017821311950684, "max_norm/layer12": 12.592409133911133, "max_norm/layer13": 12.018542289733887, "max_norm/layer14": 12.431426048278809, "max_norm/layer15": 12.49692153930664, "max_norm/layer16": 12.016731262207031, "max_norm/layer17": 12.427252769470215, "max_norm/layer18": 12.205350875854492, "max_norm/layer19": 12.160531044006348, "max_norm/layer2": 11.837761878967285, "max_norm/layer20": 12.30910587310791, "max_norm/layer21": 12.182352066040039, "max_norm/layer22": 12.686294555664062, "max_norm/layer23": 12.399474143981934, "max_norm/layer3": 12.289910316467285, "max_norm/layer4": 12.31454849243164, "max_norm/layer5": 12.639134407043457, "max_norm/layer6": 12.315422058105469, "max_norm/layer7": 12.572528839111328, "max_norm/layer8": 12.499512672424316, "max_norm/layer9": 12.626362800598145, "mean_norm": 8.62041107316812, "mean_norm/layer0": 8.445489645004272, "mean_norm/layer1": 8.477490961551666, "mean_norm/layer10": 8.626979351043701, "mean_norm/layer11": 8.683675706386566, "mean_norm/layer12": 8.732514381408691, "mean_norm/layer13": 8.567951917648315, "mean_norm/layer14": 8.662712216377258, "mean_norm/layer15": 8.731165051460266, "mean_norm/layer16": 8.571608543395996, "mean_norm/layer17": 8.684390306472778, "mean_norm/layer18": 8.562283277511597, "mean_norm/layer19": 8.563570141792297, "mean_norm/layer2": 8.239861786365509, "mean_norm/layer20": 8.617091238498688, "mean_norm/layer21": 8.609572529792786, "mean_norm/layer22": 8.809150457382202, "mean_norm/layer23": 8.823075652122498, "mean_norm/layer3": 8.756663084030151, "mean_norm/layer4": 8.528301894664764, "mean_norm/layer5": 9.021451652050018, "mean_norm/layer6": 8.404954314231873, "mean_norm/layer7": 8.530861616134644, "mean_norm/layer8": 8.623531699180603, "mean_norm/layer9": 8.61551833152771, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 1350 }, { "epoch": 0.56, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4288744762576914, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 3.00097393989563, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8281, "eval_samples_per_second": 20.375, "eval_steps_per_second": 0.676, "step": 1350 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.58, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.0855, "max_norm": 12.768488883972168, "max_norm/layer0": 12.241242408752441, "max_norm/layer1": 12.424370765686035, "max_norm/layer10": 12.65182113647461, "max_norm/layer11": 12.119407653808594, "max_norm/layer12": 12.677779197692871, "max_norm/layer13": 12.085238456726074, "max_norm/layer14": 12.553781509399414, "max_norm/layer15": 12.58381175994873, "max_norm/layer16": 12.0853853225708, "max_norm/layer17": 12.551607131958008, "max_norm/layer18": 12.261463165283203, "max_norm/layer19": 12.205509185791016, "max_norm/layer2": 11.860236167907715, "max_norm/layer20": 12.388531684875488, "max_norm/layer21": 12.284324645996094, "max_norm/layer22": 12.768488883972168, "max_norm/layer23": 12.490804672241211, "max_norm/layer3": 12.376986503601074, "max_norm/layer4": 12.416421890258789, "max_norm/layer5": 12.763866424560547, "max_norm/layer6": 12.37830638885498, "max_norm/layer7": 12.686251640319824, "max_norm/layer8": 12.616026878356934, "max_norm/layer9": 12.709514617919922, "mean_norm": 8.642726625005404, "mean_norm/layer0": 8.45906376838684, "mean_norm/layer1": 8.49306035041809, "mean_norm/layer10": 8.64819061756134, "mean_norm/layer11": 8.707186877727509, "mean_norm/layer12": 8.760173201560974, "mean_norm/layer13": 8.58885395526886, "mean_norm/layer14": 8.687394678592682, "mean_norm/layer15": 8.758006572723389, "mean_norm/layer16": 8.593712091445923, "mean_norm/layer17": 8.711206674575806, "mean_norm/layer18": 8.585395872592926, "mean_norm/layer19": 8.587033748626709, "mean_norm/layer2": 8.246377110481262, "mean_norm/layer20": 8.6430304646492, "mean_norm/layer21": 8.633982956409454, "mean_norm/layer22": 8.84108155965805, "mean_norm/layer23": 8.853368699550629, "mean_norm/layer3": 8.7816281914711, "mean_norm/layer4": 8.544718623161316, "mean_norm/layer5": 9.056117296218872, "mean_norm/layer6": 8.417579352855682, "mean_norm/layer7": 8.547739028930664, "mean_norm/layer8": 8.644529163837433, "mean_norm/layer9": 8.636008143424988, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 1400 }, { "epoch": 0.58, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.428842027557059, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.993396043777466, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5577, "eval_samples_per_second": 20.852, "eval_steps_per_second": 0.692, "step": 1400 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.61, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.065, "max_norm": 12.911163330078125, "max_norm/layer0": 12.293036460876465, "max_norm/layer1": 12.547085762023926, "max_norm/layer10": 12.76215648651123, "max_norm/layer11": 12.25842571258545, "max_norm/layer12": 12.75853443145752, "max_norm/layer13": 12.15564250946045, "max_norm/layer14": 12.656801223754883, "max_norm/layer15": 12.706408500671387, "max_norm/layer16": 12.161219596862793, "max_norm/layer17": 12.7056245803833, "max_norm/layer18": 12.327484130859375, "max_norm/layer19": 12.249855995178223, "max_norm/layer2": 11.891606330871582, "max_norm/layer20": 12.475489616394043, "max_norm/layer21": 12.39600944519043, "max_norm/layer22": 12.857209205627441, "max_norm/layer23": 12.605290412902832, "max_norm/layer3": 12.465520858764648, "max_norm/layer4": 12.489715576171875, "max_norm/layer5": 12.911163330078125, "max_norm/layer6": 12.437993049621582, "max_norm/layer7": 12.785067558288574, "max_norm/layer8": 12.7163667678833, "max_norm/layer9": 12.821453094482422, "mean_norm": 8.664971977472305, "mean_norm/layer0": 8.472568154335022, "mean_norm/layer1": 8.508402287960052, "mean_norm/layer10": 8.669077575206757, "mean_norm/layer11": 8.730392575263977, "mean_norm/layer12": 8.787680089473724, "mean_norm/layer13": 8.609262645244598, "mean_norm/layer14": 8.711707293987274, "mean_norm/layer15": 8.78460282087326, "mean_norm/layer16": 8.616038620471954, "mean_norm/layer17": 8.738197267055511, "mean_norm/layer18": 8.608790636062622, "mean_norm/layer19": 8.610539197921753, "mean_norm/layer2": 8.253041744232178, "mean_norm/layer20": 8.669034600257874, "mean_norm/layer21": 8.65846562385559, "mean_norm/layer22": 8.872988402843475, "mean_norm/layer23": 8.883999526500702, "mean_norm/layer3": 8.80587100982666, "mean_norm/layer4": 8.561438500881195, "mean_norm/layer5": 9.091051876544952, "mean_norm/layer6": 8.430066585540771, "mean_norm/layer7": 8.564611732959747, "mean_norm/layer8": 8.66524201631546, "mean_norm/layer9": 8.656256675720215, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 1450 }, { "epoch": 0.61, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4306429304421541, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.986873149871826, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5366, "eval_samples_per_second": 20.89, "eval_steps_per_second": 0.693, "step": 1450 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.63, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.0722, "max_norm": 13.059762001037598, "max_norm/layer0": 12.345417022705078, "max_norm/layer1": 12.659737586975098, "max_norm/layer10": 12.856481552124023, "max_norm/layer11": 12.383923530578613, "max_norm/layer12": 12.854155540466309, "max_norm/layer13": 12.24963665008545, "max_norm/layer14": 12.79176139831543, "max_norm/layer15": 12.82961368560791, "max_norm/layer16": 12.242087364196777, "max_norm/layer17": 12.827202796936035, "max_norm/layer18": 12.374549865722656, "max_norm/layer19": 12.30087661743164, "max_norm/layer2": 11.919795989990234, "max_norm/layer20": 12.611680030822754, "max_norm/layer21": 12.485276222229004, "max_norm/layer22": 12.907124519348145, "max_norm/layer23": 12.714141845703125, "max_norm/layer3": 12.535303115844727, "max_norm/layer4": 12.54542064666748, "max_norm/layer5": 13.059762001037598, "max_norm/layer6": 12.518970489501953, "max_norm/layer7": 12.897445678710938, "max_norm/layer8": 12.807401657104492, "max_norm/layer9": 12.903473854064941, "mean_norm": 8.68662746498982, "mean_norm/layer0": 8.48574846982956, "mean_norm/layer1": 8.523551344871521, "mean_norm/layer10": 8.689225196838379, "mean_norm/layer11": 8.753485918045044, "mean_norm/layer12": 8.814705193042755, "mean_norm/layer13": 8.629233002662659, "mean_norm/layer14": 8.735382556915283, "mean_norm/layer15": 8.810544908046722, "mean_norm/layer16": 8.637446343898773, "mean_norm/layer17": 8.764160871505737, "mean_norm/layer18": 8.63146036863327, "mean_norm/layer19": 8.63357812166214, "mean_norm/layer2": 8.259207248687744, "mean_norm/layer20": 8.694165408611298, "mean_norm/layer21": 8.681831121444702, "mean_norm/layer22": 8.90420150756836, "mean_norm/layer23": 8.914546489715576, "mean_norm/layer3": 8.829843997955322, "mean_norm/layer4": 8.577266812324524, "mean_norm/layer5": 9.12503045797348, "mean_norm/layer6": 8.442515015602112, "mean_norm/layer7": 8.580586612224579, "mean_norm/layer8": 8.685438334941864, "mean_norm/layer9": 8.675903856754303, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 1500 }, { "epoch": 0.63, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4305942573912056, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.9838168621063232, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5335, "eval_samples_per_second": 20.896, "eval_steps_per_second": 0.694, "step": 1500 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.65, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.0536, "max_norm": 13.204683303833008, "max_norm/layer0": 12.397311210632324, "max_norm/layer1": 12.771734237670898, "max_norm/layer10": 12.999382019042969, "max_norm/layer11": 12.556604385375977, "max_norm/layer12": 12.944580078125, "max_norm/layer13": 12.302048683166504, "max_norm/layer14": 12.901226043701172, "max_norm/layer15": 12.932552337646484, "max_norm/layer16": 12.336416244506836, "max_norm/layer17": 12.978598594665527, "max_norm/layer18": 12.42466926574707, "max_norm/layer19": 12.365293502807617, "max_norm/layer2": 11.952788352966309, "max_norm/layer20": 12.757342338562012, "max_norm/layer21": 12.583632469177246, "max_norm/layer22": 12.97545051574707, "max_norm/layer23": 12.805314064025879, "max_norm/layer3": 12.61535358428955, "max_norm/layer4": 12.621912956237793, "max_norm/layer5": 13.204683303833008, "max_norm/layer6": 12.58818531036377, "max_norm/layer7": 12.9867525100708, "max_norm/layer8": 12.903141021728516, "max_norm/layer9": 13.003826141357422, "mean_norm": 8.707863385478655, "mean_norm/layer0": 8.498963057994843, "mean_norm/layer1": 8.538367092609406, "mean_norm/layer10": 8.70906138420105, "mean_norm/layer11": 8.776423811912537, "mean_norm/layer12": 8.841421246528625, "mean_norm/layer13": 8.649191439151764, "mean_norm/layer14": 8.758762776851654, "mean_norm/layer15": 8.83595359325409, "mean_norm/layer16": 8.658472955226898, "mean_norm/layer17": 8.789756417274475, "mean_norm/layer18": 8.654428124427795, "mean_norm/layer19": 8.656601250171661, "mean_norm/layer2": 8.265197396278381, "mean_norm/layer20": 8.719094395637512, "mean_norm/layer21": 8.704816818237305, "mean_norm/layer22": 8.934785842895508, "mean_norm/layer23": 8.943950235843658, "mean_norm/layer3": 8.853420853614807, "mean_norm/layer4": 8.591943502426147, "mean_norm/layer5": 9.157538950443268, "mean_norm/layer6": 8.45427131652832, "mean_norm/layer7": 8.59613686800003, "mean_norm/layer8": 8.705270826816559, "mean_norm/layer9": 8.694891095161438, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 1550 }, { "epoch": 0.65, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.43009130253140426, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.982506036758423, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7956, "eval_samples_per_second": 20.431, "eval_steps_per_second": 0.678, "step": 1550 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.67, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.0505, "max_norm": 13.3615140914917, "max_norm/layer0": 12.517741203308105, "max_norm/layer1": 12.865513801574707, "max_norm/layer10": 13.127941131591797, "max_norm/layer11": 12.687420845031738, "max_norm/layer12": 13.030386924743652, "max_norm/layer13": 12.377881050109863, "max_norm/layer14": 13.030510902404785, "max_norm/layer15": 13.021608352661133, "max_norm/layer16": 12.415884971618652, "max_norm/layer17": 13.139957427978516, "max_norm/layer18": 12.48414134979248, "max_norm/layer19": 12.458990097045898, "max_norm/layer2": 11.990442276000977, "max_norm/layer20": 12.859320640563965, "max_norm/layer21": 12.669166564941406, "max_norm/layer22": 13.055481910705566, "max_norm/layer23": 12.907835006713867, "max_norm/layer3": 12.686458587646484, "max_norm/layer4": 12.707650184631348, "max_norm/layer5": 13.3615140914917, "max_norm/layer6": 12.65063190460205, "max_norm/layer7": 13.089656829833984, "max_norm/layer8": 13.009183883666992, "max_norm/layer9": 13.109399795532227, "mean_norm": 8.728878619770208, "mean_norm/layer0": 8.511847734451294, "mean_norm/layer1": 8.553039729595184, "mean_norm/layer10": 8.729139029979706, "mean_norm/layer11": 8.798815786838531, "mean_norm/layer12": 8.867528319358826, "mean_norm/layer13": 8.668808817863464, "mean_norm/layer14": 8.782176852226257, "mean_norm/layer15": 8.861507177352905, "mean_norm/layer16": 8.679296255111694, "mean_norm/layer17": 8.815626800060272, "mean_norm/layer18": 8.677160620689392, "mean_norm/layer19": 8.679296314716339, "mean_norm/layer2": 8.271026909351349, "mean_norm/layer20": 8.743983507156372, "mean_norm/layer21": 8.727519035339355, "mean_norm/layer22": 8.9653200507164, "mean_norm/layer23": 8.97294557094574, "mean_norm/layer3": 8.87597405910492, "mean_norm/layer4": 8.607149243354797, "mean_norm/layer5": 9.19001019001007, "mean_norm/layer6": 8.466087341308594, "mean_norm/layer7": 8.611168026924133, "mean_norm/layer8": 8.724406242370605, "mean_norm/layer9": 8.713253259658813, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 1600 }, { "epoch": 0.67, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4306591547924703, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.9796295166015625, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8191, "eval_samples_per_second": 20.391, "eval_steps_per_second": 0.677, "step": 1600 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.69, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.0475, "max_norm": 13.540763854980469, "max_norm/layer0": 12.632498741149902, "max_norm/layer1": 12.943493843078613, "max_norm/layer10": 13.258481979370117, "max_norm/layer11": 12.811452865600586, "max_norm/layer12": 13.11585807800293, "max_norm/layer13": 12.44717025756836, "max_norm/layer14": 13.164324760437012, "max_norm/layer15": 13.170096397399902, "max_norm/layer16": 12.488635063171387, "max_norm/layer17": 13.308391571044922, "max_norm/layer18": 12.548270225524902, "max_norm/layer19": 12.54361629486084, "max_norm/layer2": 12.023127555847168, "max_norm/layer20": 12.954742431640625, "max_norm/layer21": 12.747000694274902, "max_norm/layer22": 13.133721351623535, "max_norm/layer23": 13.020496368408203, "max_norm/layer3": 12.763312339782715, "max_norm/layer4": 12.796082496643066, "max_norm/layer5": 13.540763854980469, "max_norm/layer6": 12.707022666931152, "max_norm/layer7": 13.211490631103516, "max_norm/layer8": 13.115765571594238, "max_norm/layer9": 13.189752578735352, "mean_norm": 8.749427725871405, "mean_norm/layer0": 8.52438485622406, "mean_norm/layer1": 8.567584753036499, "mean_norm/layer10": 8.74834829568863, "mean_norm/layer11": 8.820571064949036, "mean_norm/layer12": 8.892871975898743, "mean_norm/layer13": 8.687913954257965, "mean_norm/layer14": 8.805040657520294, "mean_norm/layer15": 8.88647973537445, "mean_norm/layer16": 8.699283361434937, "mean_norm/layer17": 8.841068029403687, "mean_norm/layer18": 8.699337124824524, "mean_norm/layer19": 8.701597511768341, "mean_norm/layer2": 8.277015924453735, "mean_norm/layer20": 8.768545150756836, "mean_norm/layer21": 8.749671161174774, "mean_norm/layer22": 8.995070099830627, "mean_norm/layer23": 9.001830399036407, "mean_norm/layer3": 8.898363590240479, "mean_norm/layer4": 8.62207943201065, "mean_norm/layer5": 9.221762597560883, "mean_norm/layer6": 8.477177321910858, "mean_norm/layer7": 8.626116931438446, "mean_norm/layer8": 8.743105173110962, "mean_norm/layer9": 8.731046319007874, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 1650 }, { "epoch": 0.69, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4328169933845212, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.9699418544769287, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7962, "eval_samples_per_second": 20.43, "eval_steps_per_second": 0.678, "step": 1650 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.71, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.0322, "max_norm": 13.67343807220459, "max_norm/layer0": 12.717508316040039, "max_norm/layer1": 13.026078224182129, "max_norm/layer10": 13.373031616210938, "max_norm/layer11": 12.978168487548828, "max_norm/layer12": 13.207404136657715, "max_norm/layer13": 12.527669906616211, "max_norm/layer14": 13.306821823120117, "max_norm/layer15": 13.35703182220459, "max_norm/layer16": 12.5789155960083, "max_norm/layer17": 13.446418762207031, "max_norm/layer18": 12.62332534790039, "max_norm/layer19": 12.609963417053223, "max_norm/layer2": 12.068394660949707, "max_norm/layer20": 13.062036514282227, "max_norm/layer21": 12.836729049682617, "max_norm/layer22": 13.222061157226562, "max_norm/layer23": 13.132906913757324, "max_norm/layer3": 12.828428268432617, "max_norm/layer4": 12.867692947387695, "max_norm/layer5": 13.67343807220459, "max_norm/layer6": 12.808048248291016, "max_norm/layer7": 13.316970825195312, "max_norm/layer8": 13.244258880615234, "max_norm/layer9": 13.288371086120605, "mean_norm": 8.769363696376482, "mean_norm/layer0": 8.536643624305725, "mean_norm/layer1": 8.581710577011108, "mean_norm/layer10": 8.76716548204422, "mean_norm/layer11": 8.841660916805267, "mean_norm/layer12": 8.917559087276459, "mean_norm/layer13": 8.706561088562012, "mean_norm/layer14": 8.82697319984436, "mean_norm/layer15": 8.910794138908386, "mean_norm/layer16": 8.71890926361084, "mean_norm/layer17": 8.8657585978508, "mean_norm/layer18": 8.72101479768753, "mean_norm/layer19": 8.723503530025482, "mean_norm/layer2": 8.282784938812256, "mean_norm/layer20": 8.791405975818634, "mean_norm/layer21": 8.771677851676941, "mean_norm/layer22": 9.024154126644135, "mean_norm/layer23": 9.02972674369812, "mean_norm/layer3": 8.919883489608765, "mean_norm/layer4": 8.636090219020844, "mean_norm/layer5": 9.252493143081665, "mean_norm/layer6": 8.487660467624664, "mean_norm/layer7": 8.640743553638458, "mean_norm/layer8": 8.761323869228363, "mean_norm/layer9": 8.74853003025055, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 1700 }, { "epoch": 0.71, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.43344974304685185, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.96112060546875, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5347, "eval_samples_per_second": 20.893, "eval_steps_per_second": 0.694, "step": 1700 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.73, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.0316, "max_norm": 13.7894926071167, "max_norm/layer0": 12.797962188720703, "max_norm/layer1": 13.098018646240234, "max_norm/layer10": 13.477941513061523, "max_norm/layer11": 13.097651481628418, "max_norm/layer12": 13.281977653503418, "max_norm/layer13": 12.603769302368164, "max_norm/layer14": 13.395450592041016, "max_norm/layer15": 13.554838180541992, "max_norm/layer16": 12.664692878723145, "max_norm/layer17": 13.577613830566406, "max_norm/layer18": 12.694923400878906, "max_norm/layer19": 12.688633918762207, "max_norm/layer2": 12.093019485473633, "max_norm/layer20": 13.206803321838379, "max_norm/layer21": 12.924551010131836, "max_norm/layer22": 13.276300430297852, "max_norm/layer23": 13.243668556213379, "max_norm/layer3": 12.960731506347656, "max_norm/layer4": 12.94802188873291, "max_norm/layer5": 13.7894926071167, "max_norm/layer6": 12.89012622833252, "max_norm/layer7": 13.404141426086426, "max_norm/layer8": 13.369832038879395, "max_norm/layer9": 13.391281127929688, "mean_norm": 8.78863892952601, "mean_norm/layer0": 8.54848575592041, "mean_norm/layer1": 8.595603168010712, "mean_norm/layer10": 8.785156428813934, "mean_norm/layer11": 8.8616703748703, "mean_norm/layer12": 8.941543579101562, "mean_norm/layer13": 8.724583804607391, "mean_norm/layer14": 8.848139107227325, "mean_norm/layer15": 8.934328258037567, "mean_norm/layer16": 8.738065421581268, "mean_norm/layer17": 8.889622032642365, "mean_norm/layer18": 8.742164075374603, "mean_norm/layer19": 8.744739770889282, "mean_norm/layer2": 8.288312077522278, "mean_norm/layer20": 8.814082443714142, "mean_norm/layer21": 8.792964518070221, "mean_norm/layer22": 9.052066385746002, "mean_norm/layer23": 9.05666446685791, "mean_norm/layer3": 8.940515279769897, "mean_norm/layer4": 8.64976292848587, "mean_norm/layer5": 9.281967520713806, "mean_norm/layer6": 8.497880458831787, "mean_norm/layer7": 8.654960215091705, "mean_norm/layer8": 8.778730392456055, "mean_norm/layer9": 8.765325844287872, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 1750 }, { "epoch": 0.73, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.43388374441780947, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.9500808715820312, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.803, "eval_samples_per_second": 20.419, "eval_steps_per_second": 0.678, "step": 1750 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.75, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.02, "max_norm": 13.906452178955078, "max_norm/layer0": 12.882908821105957, "max_norm/layer1": 13.187368392944336, "max_norm/layer10": 13.588659286499023, "max_norm/layer11": 13.258871078491211, "max_norm/layer12": 13.408331871032715, "max_norm/layer13": 12.65833568572998, "max_norm/layer14": 13.496163368225098, "max_norm/layer15": 13.707235336303711, "max_norm/layer16": 12.777694702148438, "max_norm/layer17": 13.714956283569336, "max_norm/layer18": 12.791309356689453, "max_norm/layer19": 12.784247398376465, "max_norm/layer2": 12.128005027770996, "max_norm/layer20": 13.322413444519043, "max_norm/layer21": 13.02280330657959, "max_norm/layer22": 13.338006973266602, "max_norm/layer23": 13.346099853515625, "max_norm/layer3": 13.023100852966309, "max_norm/layer4": 13.038986206054688, "max_norm/layer5": 13.906452178955078, "max_norm/layer6": 13.03666877746582, "max_norm/layer7": 13.498882293701172, "max_norm/layer8": 13.546557426452637, "max_norm/layer9": 13.48300552368164, "mean_norm": 8.807754442095757, "mean_norm/layer0": 8.560234010219574, "mean_norm/layer1": 8.609053313732147, "mean_norm/layer10": 8.802674889564514, "mean_norm/layer11": 8.881379961967468, "mean_norm/layer12": 8.965039670467377, "mean_norm/layer13": 8.74233728647232, "mean_norm/layer14": 8.869293451309204, "mean_norm/layer15": 8.957258760929108, "mean_norm/layer16": 8.757313013076782, "mean_norm/layer17": 8.913440644741058, "mean_norm/layer18": 8.763157367706299, "mean_norm/layer19": 8.765839517116547, "mean_norm/layer2": 8.293516039848328, "mean_norm/layer20": 8.836040437221527, "mean_norm/layer21": 8.81434577703476, "mean_norm/layer22": 9.0809645652771, "mean_norm/layer23": 9.083868980407715, "mean_norm/layer3": 8.96069985628128, "mean_norm/layer4": 8.663160383701324, "mean_norm/layer5": 9.310991764068604, "mean_norm/layer6": 8.508190274238586, "mean_norm/layer7": 8.669151663780212, "mean_norm/layer8": 8.796195685863495, "mean_norm/layer9": 8.781959295272827, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 1800 }, { "epoch": 0.75, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.43465034497024857, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.9467976093292236, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5398, "eval_samples_per_second": 20.884, "eval_steps_per_second": 0.693, "step": 1800 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.77, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.0245, "max_norm": 14.01785659790039, "max_norm/layer0": 12.971237182617188, "max_norm/layer1": 13.28554630279541, "max_norm/layer10": 13.687850952148438, "max_norm/layer11": 13.372243881225586, "max_norm/layer12": 13.521031379699707, "max_norm/layer13": 12.716824531555176, "max_norm/layer14": 13.601958274841309, "max_norm/layer15": 13.830903053283691, "max_norm/layer16": 12.890148162841797, "max_norm/layer17": 13.841341018676758, "max_norm/layer18": 12.844350814819336, "max_norm/layer19": 12.881791114807129, "max_norm/layer2": 12.16059398651123, "max_norm/layer20": 13.44249439239502, "max_norm/layer21": 13.136921882629395, "max_norm/layer22": 13.400025367736816, "max_norm/layer23": 13.452230453491211, "max_norm/layer3": 13.076272010803223, "max_norm/layer4": 13.150069236755371, "max_norm/layer5": 14.01785659790039, "max_norm/layer6": 13.116811752319336, "max_norm/layer7": 13.590741157531738, "max_norm/layer8": 13.703124046325684, "max_norm/layer9": 13.586084365844727, "mean_norm": 8.82675089687109, "mean_norm/layer0": 8.572085976600647, "mean_norm/layer1": 8.62241667509079, "mean_norm/layer10": 8.82029390335083, "mean_norm/layer11": 8.901059448719025, "mean_norm/layer12": 8.988628685474396, "mean_norm/layer13": 8.75994199514389, "mean_norm/layer14": 8.890415966510773, "mean_norm/layer15": 8.980129182338715, "mean_norm/layer16": 8.776431798934937, "mean_norm/layer17": 8.936899721622467, "mean_norm/layer18": 8.784013092517853, "mean_norm/layer19": 8.786966979503632, "mean_norm/layer2": 8.298439383506775, "mean_norm/layer20": 8.858497023582458, "mean_norm/layer21": 8.83534300327301, "mean_norm/layer22": 9.109531104564667, "mean_norm/layer23": 9.110761523246765, "mean_norm/layer3": 8.980851411819458, "mean_norm/layer4": 8.676248848438263, "mean_norm/layer5": 9.340028464794159, "mean_norm/layer6": 8.518348813056946, "mean_norm/layer7": 8.682745039463043, "mean_norm/layer8": 8.81353086233139, "mean_norm/layer9": 8.79841262102127, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 1850 }, { "epoch": 0.77, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4355183477121638, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.940542697906494, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8237, "eval_samples_per_second": 20.383, "eval_steps_per_second": 0.677, "step": 1850 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.79, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.0247, "max_norm": 14.138656616210938, "max_norm/layer0": 13.052218437194824, "max_norm/layer1": 13.381721496582031, "max_norm/layer10": 13.791936874389648, "max_norm/layer11": 13.474544525146484, "max_norm/layer12": 13.667418479919434, "max_norm/layer13": 12.79587459564209, "max_norm/layer14": 13.703073501586914, "max_norm/layer15": 13.987411499023438, "max_norm/layer16": 12.992448806762695, "max_norm/layer17": 13.965337753295898, "max_norm/layer18": 12.948287010192871, "max_norm/layer19": 12.983268737792969, "max_norm/layer2": 12.176477432250977, "max_norm/layer20": 13.5822172164917, "max_norm/layer21": 13.263895034790039, "max_norm/layer22": 13.479641914367676, "max_norm/layer23": 13.553653717041016, "max_norm/layer3": 13.128030776977539, "max_norm/layer4": 13.215946197509766, "max_norm/layer5": 14.138656616210938, "max_norm/layer6": 13.19811725616455, "max_norm/layer7": 13.667899131774902, "max_norm/layer8": 13.788747787475586, "max_norm/layer9": 13.685811996459961, "mean_norm": 8.845184216896692, "mean_norm/layer0": 8.5836620926857, "mean_norm/layer1": 8.635238826274872, "mean_norm/layer10": 8.837403535842896, "mean_norm/layer11": 8.920144736766815, "mean_norm/layer12": 9.011907458305359, "mean_norm/layer13": 8.777201354503632, "mean_norm/layer14": 8.910749077796936, "mean_norm/layer15": 9.002386212348938, "mean_norm/layer16": 8.794780671596527, "mean_norm/layer17": 8.959879457950592, "mean_norm/layer18": 8.804102182388306, "mean_norm/layer19": 8.807617962360382, "mean_norm/layer2": 8.303315997123718, "mean_norm/layer20": 8.88015216588974, "mean_norm/layer21": 8.855957210063934, "mean_norm/layer22": 9.13687926530838, "mean_norm/layer23": 9.136677742004395, "mean_norm/layer3": 9.000433564186096, "mean_norm/layer4": 8.689013838768005, "mean_norm/layer5": 9.368463218212128, "mean_norm/layer6": 8.527889966964722, "mean_norm/layer7": 8.695912837982178, "mean_norm/layer8": 8.830221474170685, "mean_norm/layer9": 8.814430356025696, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 1900 }, { "epoch": 0.79, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.436199770425443, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.9340319633483887, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5963, "eval_samples_per_second": 20.782, "eval_steps_per_second": 0.69, "step": 1900 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.81, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.0201, "max_norm": 14.271653175354004, "max_norm/layer0": 13.13520622253418, "max_norm/layer1": 13.476064682006836, "max_norm/layer10": 13.901469230651855, "max_norm/layer11": 13.575247764587402, "max_norm/layer12": 13.7691650390625, "max_norm/layer13": 12.850029945373535, "max_norm/layer14": 13.810707092285156, "max_norm/layer15": 14.146288871765137, "max_norm/layer16": 13.090737342834473, "max_norm/layer17": 14.088882446289062, "max_norm/layer18": 13.102824211120605, "max_norm/layer19": 13.057214736938477, "max_norm/layer2": 12.24477767944336, "max_norm/layer20": 13.693897247314453, "max_norm/layer21": 13.370636940002441, "max_norm/layer22": 13.551177978515625, "max_norm/layer23": 13.672248840332031, "max_norm/layer3": 13.1995267868042, "max_norm/layer4": 13.299997329711914, "max_norm/layer5": 14.271653175354004, "max_norm/layer6": 13.269554138183594, "max_norm/layer7": 13.732311248779297, "max_norm/layer8": 13.88916015625, "max_norm/layer9": 13.77952766418457, "mean_norm": 8.863051029543081, "mean_norm/layer0": 8.594872176647186, "mean_norm/layer1": 8.648047864437103, "mean_norm/layer10": 8.853616833686829, "mean_norm/layer11": 8.938627779483795, "mean_norm/layer12": 9.034486055374146, "mean_norm/layer13": 8.793805718421936, "mean_norm/layer14": 8.930472075939178, "mean_norm/layer15": 9.02397906780243, "mean_norm/layer16": 8.81262332201004, "mean_norm/layer17": 8.982100486755371, "mean_norm/layer18": 8.823445796966553, "mean_norm/layer19": 8.827480673789978, "mean_norm/layer2": 8.308004558086395, "mean_norm/layer20": 8.901043772697449, "mean_norm/layer21": 8.875850260257721, "mean_norm/layer22": 9.163272619247437, "mean_norm/layer23": 9.16199541091919, "mean_norm/layer3": 9.019525945186615, "mean_norm/layer4": 8.701404392719269, "mean_norm/layer5": 9.396052300930023, "mean_norm/layer6": 8.537376403808594, "mean_norm/layer7": 8.708706319332123, "mean_norm/layer8": 8.846332848072052, "mean_norm/layer9": 8.830102026462555, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 1950 }, { "epoch": 0.81, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4370839975176744, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.9285225868225098, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8013, "eval_samples_per_second": 20.421, "eval_steps_per_second": 0.678, "step": 1950 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.84, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.0107, "max_norm": 14.383659362792969, "max_norm/layer0": 13.219470977783203, "max_norm/layer1": 13.575953483581543, "max_norm/layer10": 14.011261940002441, "max_norm/layer11": 13.69066333770752, "max_norm/layer12": 13.898682594299316, "max_norm/layer13": 12.897134780883789, "max_norm/layer14": 13.895804405212402, "max_norm/layer15": 14.285606384277344, "max_norm/layer16": 13.165793418884277, "max_norm/layer17": 14.2105712890625, "max_norm/layer18": 13.221928596496582, "max_norm/layer19": 13.153519630432129, "max_norm/layer2": 12.27010440826416, "max_norm/layer20": 13.807734489440918, "max_norm/layer21": 13.467498779296875, "max_norm/layer22": 13.61931324005127, "max_norm/layer23": 13.794743537902832, "max_norm/layer3": 13.270720481872559, "max_norm/layer4": 13.370405197143555, "max_norm/layer5": 14.383659362792969, "max_norm/layer6": 13.332939147949219, "max_norm/layer7": 13.822017669677734, "max_norm/layer8": 13.997716903686523, "max_norm/layer9": 13.877385139465332, "mean_norm": 8.880738290647665, "mean_norm/layer0": 8.60589337348938, "mean_norm/layer1": 8.660571813583374, "mean_norm/layer10": 8.86993956565857, "mean_norm/layer11": 8.956714928150177, "mean_norm/layer12": 9.056580424308777, "mean_norm/layer13": 8.810520350933075, "mean_norm/layer14": 8.950220763683319, "mean_norm/layer15": 9.045172274112701, "mean_norm/layer16": 8.83077585697174, "mean_norm/layer17": 9.004396915435791, "mean_norm/layer18": 8.842631757259369, "mean_norm/layer19": 8.847141087055206, "mean_norm/layer2": 8.312703967094421, "mean_norm/layer20": 8.92222511768341, "mean_norm/layer21": 8.895317256450653, "mean_norm/layer22": 9.189109563827515, "mean_norm/layer23": 9.187323927879333, "mean_norm/layer3": 9.038133919239044, "mean_norm/layer4": 8.713449716567993, "mean_norm/layer5": 9.423080027103424, "mean_norm/layer6": 8.546690106391907, "mean_norm/layer7": 8.72130572795868, "mean_norm/layer8": 8.862245798110962, "mean_norm/layer9": 8.845574736595154, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 2000 }, { "epoch": 0.84, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.43821158986464837, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.9188804626464844, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7928, "eval_samples_per_second": 20.436, "eval_steps_per_second": 0.678, "step": 2000 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.86, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 3.003, "max_norm": 14.526294708251953, "max_norm/layer0": 13.318120956420898, "max_norm/layer1": 13.691896438598633, "max_norm/layer10": 14.119477272033691, "max_norm/layer11": 13.802632331848145, "max_norm/layer12": 13.983503341674805, "max_norm/layer13": 12.947667121887207, "max_norm/layer14": 14.012450218200684, "max_norm/layer15": 14.473040580749512, "max_norm/layer16": 13.238360404968262, "max_norm/layer17": 14.329521179199219, "max_norm/layer18": 13.304075241088867, "max_norm/layer19": 13.220603942871094, "max_norm/layer2": 12.33705997467041, "max_norm/layer20": 13.91451358795166, "max_norm/layer21": 13.595061302185059, "max_norm/layer22": 13.679491996765137, "max_norm/layer23": 13.914533615112305, "max_norm/layer3": 13.341594696044922, "max_norm/layer4": 13.453817367553711, "max_norm/layer5": 14.526294708251953, "max_norm/layer6": 13.413007736206055, "max_norm/layer7": 13.901131629943848, "max_norm/layer8": 14.125232696533203, "max_norm/layer9": 13.965437889099121, "mean_norm": 8.898506715893745, "mean_norm/layer0": 8.61709862947464, "mean_norm/layer1": 8.673097789287567, "mean_norm/layer10": 8.886326968669891, "mean_norm/layer11": 8.975116968154907, "mean_norm/layer12": 9.078686237335205, "mean_norm/layer13": 8.826960861682892, "mean_norm/layer14": 8.969876110553741, "mean_norm/layer15": 9.066643118858337, "mean_norm/layer16": 8.848939836025238, "mean_norm/layer17": 9.026445209980011, "mean_norm/layer18": 8.862169206142426, "mean_norm/layer19": 8.867026507854462, "mean_norm/layer2": 8.317440271377563, "mean_norm/layer20": 8.943169057369232, "mean_norm/layer21": 8.91546756029129, "mean_norm/layer22": 9.215493023395538, "mean_norm/layer23": 9.21242493391037, "mean_norm/layer3": 9.056794881820679, "mean_norm/layer4": 8.725628674030304, "mean_norm/layer5": 9.450334191322327, "mean_norm/layer6": 8.556267082691193, "mean_norm/layer7": 8.733982026576996, "mean_norm/layer8": 8.878000140190125, "mean_norm/layer9": 8.860771894454956, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 2050 }, { "epoch": 0.86, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.43880377865118864, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.9210426807403564, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8044, "eval_samples_per_second": 20.416, "eval_steps_per_second": 0.678, "step": 2050 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.88, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.9918, "max_norm": 14.670685768127441, "max_norm/layer0": 13.415691375732422, "max_norm/layer1": 13.807945251464844, "max_norm/layer10": 14.238808631896973, "max_norm/layer11": 13.896550178527832, "max_norm/layer12": 14.093559265136719, "max_norm/layer13": 13.039774894714355, "max_norm/layer14": 14.146052360534668, "max_norm/layer15": 14.658995628356934, "max_norm/layer16": 13.320241928100586, "max_norm/layer17": 14.467944145202637, "max_norm/layer18": 13.421971321105957, "max_norm/layer19": 13.300816535949707, "max_norm/layer2": 12.368851661682129, "max_norm/layer20": 14.032940864562988, "max_norm/layer21": 13.714327812194824, "max_norm/layer22": 13.763936996459961, "max_norm/layer23": 14.012027740478516, "max_norm/layer3": 13.413012504577637, "max_norm/layer4": 13.571505546569824, "max_norm/layer5": 14.670685768127441, "max_norm/layer6": 13.480942726135254, "max_norm/layer7": 13.977544784545898, "max_norm/layer8": 14.206221580505371, "max_norm/layer9": 14.046436309814453, "mean_norm": 8.915782399475574, "mean_norm/layer0": 8.628024458885193, "mean_norm/layer1": 8.685210585594177, "mean_norm/layer10": 8.902346730232239, "mean_norm/layer11": 8.993071556091309, "mean_norm/layer12": 9.100186705589294, "mean_norm/layer13": 8.842869818210602, "mean_norm/layer14": 8.988996028900146, "mean_norm/layer15": 9.087421298027039, "mean_norm/layer16": 8.86632490158081, "mean_norm/layer17": 9.047946333885193, "mean_norm/layer18": 8.881589412689209, "mean_norm/layer19": 8.886434435844421, "mean_norm/layer2": 8.321897983551025, "mean_norm/layer20": 8.96368944644928, "mean_norm/layer21": 8.934747517108917, "mean_norm/layer22": 9.241970539093018, "mean_norm/layer23": 9.237237215042114, "mean_norm/layer3": 9.074563026428223, "mean_norm/layer4": 8.737144529819489, "mean_norm/layer5": 9.476523578166962, "mean_norm/layer6": 8.56508320569992, "mean_norm/layer7": 8.74627560377121, "mean_norm/layer8": 8.893504977226257, "mean_norm/layer9": 8.87571769952774, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 2100 }, { "epoch": 0.88, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.43886867605245333, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.909998893737793, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7897, "eval_samples_per_second": 20.442, "eval_steps_per_second": 0.679, "step": 2100 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.9, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.9853, "max_norm": 14.838692665100098, "max_norm/layer0": 13.50354290008545, "max_norm/layer1": 13.911642074584961, "max_norm/layer10": 14.337469100952148, "max_norm/layer11": 13.996798515319824, "max_norm/layer12": 14.188272476196289, "max_norm/layer13": 13.153363227844238, "max_norm/layer14": 14.2456693649292, "max_norm/layer15": 14.81822681427002, "max_norm/layer16": 13.398094177246094, "max_norm/layer17": 14.58063793182373, "max_norm/layer18": 13.529489517211914, "max_norm/layer19": 13.36036491394043, "max_norm/layer2": 12.395270347595215, "max_norm/layer20": 14.136859893798828, "max_norm/layer21": 13.848156929016113, "max_norm/layer22": 13.873931884765625, "max_norm/layer23": 14.149714469909668, "max_norm/layer3": 13.486695289611816, "max_norm/layer4": 13.675530433654785, "max_norm/layer5": 14.838692665100098, "max_norm/layer6": 13.546252250671387, "max_norm/layer7": 14.067277908325195, "max_norm/layer8": 14.312942504882812, "max_norm/layer9": 14.15059757232666, "mean_norm": 8.9328340391318, "mean_norm/layer0": 8.638837158679962, "mean_norm/layer1": 8.69721806049347, "mean_norm/layer10": 8.91822373867035, "mean_norm/layer11": 9.010710537433624, "mean_norm/layer12": 9.121225714683533, "mean_norm/layer13": 8.85855746269226, "mean_norm/layer14": 9.007853507995605, "mean_norm/layer15": 9.107969760894775, "mean_norm/layer16": 8.883861780166626, "mean_norm/layer17": 9.06923532485962, "mean_norm/layer18": 8.90061503648758, "mean_norm/layer19": 8.905701696872711, "mean_norm/layer2": 8.326269209384918, "mean_norm/layer20": 8.983186781406403, "mean_norm/layer21": 8.953919172286987, "mean_norm/layer22": 9.268231928348541, "mean_norm/layer23": 9.26182246208191, "mean_norm/layer3": 9.09225046634674, "mean_norm/layer4": 8.748473942279816, "mean_norm/layer5": 9.502384603023529, "mean_norm/layer6": 8.573933243751526, "mean_norm/layer7": 8.758572161197662, "mean_norm/layer8": 8.908560156822205, "mean_norm/layer9": 8.890403032302856, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 2150 }, { "epoch": 0.9, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4398867540347931, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.901756763458252, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8028, "eval_samples_per_second": 20.419, "eval_steps_per_second": 0.678, "step": 2150 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.92, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.9923, "max_norm": 14.992657661437988, "max_norm/layer0": 13.580909729003906, "max_norm/layer1": 14.019521713256836, "max_norm/layer10": 14.454727172851562, "max_norm/layer11": 14.117258071899414, "max_norm/layer12": 14.273975372314453, "max_norm/layer13": 13.259902000427246, "max_norm/layer14": 14.327220916748047, "max_norm/layer15": 14.929570198059082, "max_norm/layer16": 13.4490385055542, "max_norm/layer17": 14.68906021118164, "max_norm/layer18": 13.657282829284668, "max_norm/layer19": 13.454545974731445, "max_norm/layer2": 12.426871299743652, "max_norm/layer20": 14.252646446228027, "max_norm/layer21": 13.96719741821289, "max_norm/layer22": 14.019536018371582, "max_norm/layer23": 14.235506057739258, "max_norm/layer3": 13.598733901977539, "max_norm/layer4": 13.746255874633789, "max_norm/layer5": 14.992657661437988, "max_norm/layer6": 13.630704879760742, "max_norm/layer7": 14.18418025970459, "max_norm/layer8": 14.406624794006348, "max_norm/layer9": 14.30229377746582, "mean_norm": 8.949172087013721, "mean_norm/layer0": 8.649221539497375, "mean_norm/layer1": 8.708901345729828, "mean_norm/layer10": 8.93329781293869, "mean_norm/layer11": 9.027457654476166, "mean_norm/layer12": 9.141777276992798, "mean_norm/layer13": 8.873935222625732, "mean_norm/layer14": 9.02572363615036, "mean_norm/layer15": 9.127559781074524, "mean_norm/layer16": 8.90040373802185, "mean_norm/layer17": 9.089453399181366, "mean_norm/layer18": 8.918771147727966, "mean_norm/layer19": 8.924110770225525, "mean_norm/layer2": 8.330630600452423, "mean_norm/layer20": 9.002286434173584, "mean_norm/layer21": 8.972177803516388, "mean_norm/layer22": 9.292498588562012, "mean_norm/layer23": 9.28546392917633, "mean_norm/layer3": 9.109552025794983, "mean_norm/layer4": 8.759545028209686, "mean_norm/layer5": 9.527128338813782, "mean_norm/layer6": 8.582504987716675, "mean_norm/layer7": 8.770052433013916, "mean_norm/layer8": 8.923248827457428, "mean_norm/layer9": 8.904427766799927, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 2200 }, { "epoch": 0.92, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4405722328356514, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.899564027786255, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7906, "eval_samples_per_second": 20.44, "eval_steps_per_second": 0.679, "step": 2200 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.94, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.9791, "max_norm": 15.16025447845459, "max_norm/layer0": 13.65170955657959, "max_norm/layer1": 14.106208801269531, "max_norm/layer10": 14.575181007385254, "max_norm/layer11": 14.219459533691406, "max_norm/layer12": 14.364925384521484, "max_norm/layer13": 13.383106231689453, "max_norm/layer14": 14.4501314163208, "max_norm/layer15": 14.990113258361816, "max_norm/layer16": 13.513087272644043, "max_norm/layer17": 14.812724113464355, "max_norm/layer18": 13.795426368713379, "max_norm/layer19": 13.57463264465332, "max_norm/layer2": 12.443663597106934, "max_norm/layer20": 14.366467475891113, "max_norm/layer21": 14.078028678894043, "max_norm/layer22": 14.125088691711426, "max_norm/layer23": 14.330960273742676, "max_norm/layer3": 13.687296867370605, "max_norm/layer4": 13.831295013427734, "max_norm/layer5": 15.16025447845459, "max_norm/layer6": 13.669600486755371, "max_norm/layer7": 14.281567573547363, "max_norm/layer8": 14.49099349975586, "max_norm/layer9": 14.393123626708984, "mean_norm": 8.96567795674006, "mean_norm/layer0": 8.65979665517807, "mean_norm/layer1": 8.720866560935974, "mean_norm/layer10": 8.948398649692535, "mean_norm/layer11": 9.044549465179443, "mean_norm/layer12": 9.16236698627472, "mean_norm/layer13": 8.88937371969223, "mean_norm/layer14": 9.043819427490234, "mean_norm/layer15": 9.147380352020264, "mean_norm/layer16": 8.91715395450592, "mean_norm/layer17": 9.10979026556015, "mean_norm/layer18": 8.93702483177185, "mean_norm/layer19": 8.943160235881805, "mean_norm/layer2": 8.334900140762329, "mean_norm/layer20": 9.021081447601318, "mean_norm/layer21": 8.991265833377838, "mean_norm/layer22": 9.317129492759705, "mean_norm/layer23": 9.309127569198608, "mean_norm/layer3": 9.127320051193237, "mean_norm/layer4": 8.770549535751343, "mean_norm/layer5": 9.552104949951172, "mean_norm/layer6": 8.59102463722229, "mean_norm/layer7": 8.781688511371613, "mean_norm/layer8": 8.938059091567993, "mean_norm/layer9": 8.918338596820831, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 2250 }, { "epoch": 0.94, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4413428894756696, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.900628089904785, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8107, "eval_samples_per_second": 20.405, "eval_steps_per_second": 0.677, "step": 2250 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.96, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.9806, "max_norm": 15.3043851852417, "max_norm/layer0": 13.725802421569824, "max_norm/layer1": 14.185372352600098, "max_norm/layer10": 14.689973831176758, "max_norm/layer11": 14.349565505981445, "max_norm/layer12": 14.45600700378418, "max_norm/layer13": 13.499764442443848, "max_norm/layer14": 14.550609588623047, "max_norm/layer15": 15.10234546661377, "max_norm/layer16": 13.573525428771973, "max_norm/layer17": 14.938157081604004, "max_norm/layer18": 13.935149192810059, "max_norm/layer19": 13.665972709655762, "max_norm/layer2": 12.481348037719727, "max_norm/layer20": 14.470271110534668, "max_norm/layer21": 14.191650390625, "max_norm/layer22": 14.222891807556152, "max_norm/layer23": 14.447844505310059, "max_norm/layer3": 13.801197052001953, "max_norm/layer4": 13.936980247497559, "max_norm/layer5": 15.3043851852417, "max_norm/layer6": 13.723240852355957, "max_norm/layer7": 14.402823448181152, "max_norm/layer8": 14.585365295410156, "max_norm/layer9": 14.490229606628418, "mean_norm": 8.982164661089579, "mean_norm/layer0": 8.670240640640259, "mean_norm/layer1": 8.732674479484558, "mean_norm/layer10": 8.963507533073425, "mean_norm/layer11": 9.06149274110794, "mean_norm/layer12": 9.183135092258453, "mean_norm/layer13": 8.904652893543243, "mean_norm/layer14": 9.061905086040497, "mean_norm/layer15": 9.167264759540558, "mean_norm/layer16": 8.934041142463684, "mean_norm/layer17": 9.130063891410828, "mean_norm/layer18": 8.95542061328888, "mean_norm/layer19": 8.962070345878601, "mean_norm/layer2": 8.339269459247589, "mean_norm/layer20": 9.040118932723999, "mean_norm/layer21": 9.009513676166534, "mean_norm/layer22": 9.341909527778625, "mean_norm/layer23": 9.333087861537933, "mean_norm/layer3": 9.14510715007782, "mean_norm/layer4": 8.781482458114624, "mean_norm/layer5": 9.576900124549866, "mean_norm/layer6": 8.599566221237183, "mean_norm/layer7": 8.79344254732132, "mean_norm/layer8": 8.95266330242157, "mean_norm/layer9": 8.932421386241913, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 2300 }, { "epoch": 0.96, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4420364804516859, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.8937957286834717, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7988, "eval_samples_per_second": 20.426, "eval_steps_per_second": 0.678, "step": 2300 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 0.98, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.9658, "max_norm": 15.441264152526855, "max_norm/layer0": 13.801191329956055, "max_norm/layer1": 14.290616989135742, "max_norm/layer10": 14.793299674987793, "max_norm/layer11": 14.459893226623535, "max_norm/layer12": 14.546797752380371, "max_norm/layer13": 13.60170841217041, "max_norm/layer14": 14.642404556274414, "max_norm/layer15": 15.176553726196289, "max_norm/layer16": 13.654974937438965, "max_norm/layer17": 15.051509857177734, "max_norm/layer18": 14.04863166809082, "max_norm/layer19": 13.769092559814453, "max_norm/layer2": 12.504697799682617, "max_norm/layer20": 14.588030815124512, "max_norm/layer21": 14.302506446838379, "max_norm/layer22": 14.334789276123047, "max_norm/layer23": 14.561293601989746, "max_norm/layer3": 13.900928497314453, "max_norm/layer4": 14.038566589355469, "max_norm/layer5": 15.441264152526855, "max_norm/layer6": 13.786172866821289, "max_norm/layer7": 14.514456748962402, "max_norm/layer8": 14.683159828186035, "max_norm/layer9": 14.579593658447266, "mean_norm": 8.998664572834969, "mean_norm/layer0": 8.680808067321777, "mean_norm/layer1": 8.744622588157654, "mean_norm/layer10": 8.978585541248322, "mean_norm/layer11": 9.078620612621307, "mean_norm/layer12": 9.203763127326965, "mean_norm/layer13": 8.91998440027237, "mean_norm/layer14": 9.07971066236496, "mean_norm/layer15": 9.186996579170227, "mean_norm/layer16": 8.95055615901947, "mean_norm/layer17": 9.15077942609787, "mean_norm/layer18": 8.973953247070312, "mean_norm/layer19": 8.980820953845978, "mean_norm/layer2": 8.34368771314621, "mean_norm/layer20": 9.059822857379913, "mean_norm/layer21": 9.02804982662201, "mean_norm/layer22": 9.366870760917664, "mean_norm/layer23": 9.357110679149628, "mean_norm/layer3": 9.162328720092773, "mean_norm/layer4": 8.792425751686096, "mean_norm/layer5": 9.601547956466675, "mean_norm/layer6": 8.608037114143372, "mean_norm/layer7": 8.804958939552307, "mean_norm/layer8": 8.967408537864685, "mean_norm/layer9": 8.946499526500702, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 2350 }, { "epoch": 0.98, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.44169982518262535, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.8900845050811768, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5515, "eval_samples_per_second": 20.863, "eval_steps_per_second": 0.693, "step": 2350 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.0, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.9577, "max_norm": 15.574953079223633, "max_norm/layer0": 13.878785133361816, "max_norm/layer1": 14.37764835357666, "max_norm/layer10": 14.902111053466797, "max_norm/layer11": 14.557250022888184, "max_norm/layer12": 14.682308197021484, "max_norm/layer13": 13.673648834228516, "max_norm/layer14": 14.743877410888672, "max_norm/layer15": 15.239487648010254, "max_norm/layer16": 13.727298736572266, "max_norm/layer17": 15.168072700500488, "max_norm/layer18": 14.170589447021484, "max_norm/layer19": 13.88883113861084, "max_norm/layer2": 12.54202938079834, "max_norm/layer20": 14.685086250305176, "max_norm/layer21": 14.394617080688477, "max_norm/layer22": 14.45186710357666, "max_norm/layer23": 14.659900665283203, "max_norm/layer3": 13.987744331359863, "max_norm/layer4": 14.10349178314209, "max_norm/layer5": 15.574953079223633, "max_norm/layer6": 13.852619171142578, "max_norm/layer7": 14.626072883605957, "max_norm/layer8": 14.781867027282715, "max_norm/layer9": 14.68445110321045, "mean_norm": 9.014564402401447, "mean_norm/layer0": 8.691066265106201, "mean_norm/layer1": 8.756228804588318, "mean_norm/layer10": 8.993315815925598, "mean_norm/layer11": 9.095087945461273, "mean_norm/layer12": 9.223419189453125, "mean_norm/layer13": 8.934724807739258, "mean_norm/layer14": 9.097132921218872, "mean_norm/layer15": 9.206078290939331, "mean_norm/layer16": 8.96629410982132, "mean_norm/layer17": 9.170451998710632, "mean_norm/layer18": 8.991504669189453, "mean_norm/layer19": 8.998610973358154, "mean_norm/layer2": 8.347860455513, "mean_norm/layer20": 9.078348338603973, "mean_norm/layer21": 9.045956909656525, "mean_norm/layer22": 9.390547633171082, "mean_norm/layer23": 9.38027411699295, "mean_norm/layer3": 9.179291546344757, "mean_norm/layer4": 8.803498148918152, "mean_norm/layer5": 9.625588476657867, "mean_norm/layer6": 8.616418182849884, "mean_norm/layer7": 8.816068053245544, "mean_norm/layer8": 8.981455445289612, "mean_norm/layer9": 8.960322558879852, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 2400 }, { "epoch": 1.0, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.44255971574938247, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.885669231414795, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5534, "eval_samples_per_second": 20.86, "eval_steps_per_second": 0.692, "step": 2400 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.02, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8357, "max_norm": 15.723752975463867, "max_norm/layer0": 13.947762489318848, "max_norm/layer1": 14.477116584777832, "max_norm/layer10": 15.02506160736084, "max_norm/layer11": 14.6520414352417, "max_norm/layer12": 14.819252014160156, "max_norm/layer13": 13.743169784545898, "max_norm/layer14": 14.834115982055664, "max_norm/layer15": 15.359285354614258, "max_norm/layer16": 13.801314353942871, "max_norm/layer17": 15.277505874633789, "max_norm/layer18": 14.275938034057617, "max_norm/layer19": 14.013418197631836, "max_norm/layer2": 12.606481552124023, "max_norm/layer20": 14.789701461791992, "max_norm/layer21": 14.507436752319336, "max_norm/layer22": 14.583073616027832, "max_norm/layer23": 14.75890827178955, "max_norm/layer3": 14.087556838989258, "max_norm/layer4": 14.228026390075684, "max_norm/layer5": 15.723752975463867, "max_norm/layer6": 13.925374984741211, "max_norm/layer7": 14.710521697998047, "max_norm/layer8": 14.911945343017578, "max_norm/layer9": 14.783496856689453, "mean_norm": 9.031480019291243, "mean_norm/layer0": 8.701723158359528, "mean_norm/layer1": 8.768332779407501, "mean_norm/layer10": 9.00841349363327, "mean_norm/layer11": 9.112366914749146, "mean_norm/layer12": 9.244458794593811, "mean_norm/layer13": 8.950533390045166, "mean_norm/layer14": 9.115843534469604, "mean_norm/layer15": 9.226688921451569, "mean_norm/layer16": 8.983336091041565, "mean_norm/layer17": 9.191466331481934, "mean_norm/layer18": 9.01020735502243, "mean_norm/layer19": 9.017823576927185, "mean_norm/layer2": 8.352315068244934, "mean_norm/layer20": 9.098797261714935, "mean_norm/layer21": 9.06588214635849, "mean_norm/layer22": 9.41590791940689, "mean_norm/layer23": 9.405222654342651, "mean_norm/layer3": 9.196974635124207, "mean_norm/layer4": 8.814748108386993, "mean_norm/layer5": 9.65069442987442, "mean_norm/layer6": 8.625239789485931, "mean_norm/layer7": 8.827593207359314, "mean_norm/layer8": 8.996190905570984, "mean_norm/layer9": 8.974759995937347, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 2450 }, { "epoch": 1.02, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.44219061177968955, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.891197443008423, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7944, "eval_samples_per_second": 20.433, "eval_steps_per_second": 0.678, "step": 2450 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.04, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8427, "max_norm": 15.870335578918457, "max_norm/layer0": 14.013547897338867, "max_norm/layer1": 14.573381423950195, "max_norm/layer10": 15.130743026733398, "max_norm/layer11": 14.750649452209473, "max_norm/layer12": 14.940457344055176, "max_norm/layer13": 13.85982894897461, "max_norm/layer14": 14.928179740905762, "max_norm/layer15": 15.517732620239258, "max_norm/layer16": 13.898526191711426, "max_norm/layer17": 15.39119815826416, "max_norm/layer18": 14.368980407714844, "max_norm/layer19": 14.072687149047852, "max_norm/layer2": 12.69582748413086, "max_norm/layer20": 14.895695686340332, "max_norm/layer21": 14.618597030639648, "max_norm/layer22": 14.678531646728516, "max_norm/layer23": 14.874917030334473, "max_norm/layer3": 14.15068244934082, "max_norm/layer4": 14.324492454528809, "max_norm/layer5": 15.870335578918457, "max_norm/layer6": 13.982853889465332, "max_norm/layer7": 14.777878761291504, "max_norm/layer8": 15.033072471618652, "max_norm/layer9": 14.886922836303711, "mean_norm": 9.048154046138128, "mean_norm/layer0": 8.712783455848694, "mean_norm/layer1": 8.780392825603485, "mean_norm/layer10": 9.02328896522522, "mean_norm/layer11": 9.129519879817963, "mean_norm/layer12": 9.265049755573273, "mean_norm/layer13": 8.966003775596619, "mean_norm/layer14": 9.13392037153244, "mean_norm/layer15": 9.246784627437592, "mean_norm/layer16": 8.9999498128891, "mean_norm/layer17": 9.212452232837677, "mean_norm/layer18": 9.028715074062347, "mean_norm/layer19": 9.0364351272583, "mean_norm/layer2": 8.356776595115662, "mean_norm/layer20": 9.11862301826477, "mean_norm/layer21": 9.0850949883461, "mean_norm/layer22": 9.4408740401268, "mean_norm/layer23": 9.429868519306183, "mean_norm/layer3": 9.214716017246246, "mean_norm/layer4": 8.826160609722137, "mean_norm/layer5": 9.675524532794952, "mean_norm/layer6": 8.633809804916382, "mean_norm/layer7": 8.83916038274765, "mean_norm/layer8": 9.010636866092682, "mean_norm/layer9": 8.98915582895279, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 2500 }, { "epoch": 1.04, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4415984229931493, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.8902156352996826, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8087, "eval_samples_per_second": 20.409, "eval_steps_per_second": 0.677, "step": 2500 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.06, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8524, "max_norm": 16.009868621826172, "max_norm/layer0": 14.078265190124512, "max_norm/layer1": 14.670526504516602, "max_norm/layer10": 15.227030754089355, "max_norm/layer11": 14.859092712402344, "max_norm/layer12": 15.091114044189453, "max_norm/layer13": 13.921088218688965, "max_norm/layer14": 15.035015106201172, "max_norm/layer15": 15.675447463989258, "max_norm/layer16": 14.004446983337402, "max_norm/layer17": 15.502359390258789, "max_norm/layer18": 14.5051851272583, "max_norm/layer19": 14.167274475097656, "max_norm/layer2": 12.767056465148926, "max_norm/layer20": 15.009303092956543, "max_norm/layer21": 14.740386009216309, "max_norm/layer22": 14.763566970825195, "max_norm/layer23": 14.968628883361816, "max_norm/layer3": 14.237839698791504, "max_norm/layer4": 14.436867713928223, "max_norm/layer5": 16.009868621826172, "max_norm/layer6": 14.039834022521973, "max_norm/layer7": 14.868507385253906, "max_norm/layer8": 15.15004825592041, "max_norm/layer9": 14.995036125183105, "mean_norm": 9.064850961168608, "mean_norm/layer0": 8.724150776863098, "mean_norm/layer1": 8.792477667331696, "mean_norm/layer10": 9.038262903690338, "mean_norm/layer11": 9.146433353424072, "mean_norm/layer12": 9.2858447432518, "mean_norm/layer13": 8.981484949588776, "mean_norm/layer14": 9.152089536190033, "mean_norm/layer15": 9.266744434833527, "mean_norm/layer16": 9.016795575618744, "mean_norm/layer17": 9.233408987522125, "mean_norm/layer18": 9.046853363513947, "mean_norm/layer19": 9.05537211894989, "mean_norm/layer2": 8.361333727836609, "mean_norm/layer20": 9.13805490732193, "mean_norm/layer21": 9.10432755947113, "mean_norm/layer22": 9.466131627559662, "mean_norm/layer23": 9.454012274742126, "mean_norm/layer3": 9.232695639133453, "mean_norm/layer4": 8.837390780448914, "mean_norm/layer5": 9.700556099414825, "mean_norm/layer6": 8.642646074295044, "mean_norm/layer7": 8.850711584091187, "mean_norm/layer8": 9.025233507156372, "mean_norm/layer9": 9.003410875797272, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 2550 }, { "epoch": 1.06, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4432127458496084, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.883772850036621, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.774, "eval_samples_per_second": 20.469, "eval_steps_per_second": 0.679, "step": 2550 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.09, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8441, "max_norm": 16.144901275634766, "max_norm/layer0": 14.166998863220215, "max_norm/layer1": 14.77054500579834, "max_norm/layer10": 15.321858406066895, "max_norm/layer11": 14.944963455200195, "max_norm/layer12": 15.217597007751465, "max_norm/layer13": 13.982170104980469, "max_norm/layer14": 15.154606819152832, "max_norm/layer15": 15.824800491333008, "max_norm/layer16": 14.139287948608398, "max_norm/layer17": 15.600570678710938, "max_norm/layer18": 14.64634895324707, "max_norm/layer19": 14.26150894165039, "max_norm/layer2": 12.838845252990723, "max_norm/layer20": 15.12016487121582, "max_norm/layer21": 14.849102973937988, "max_norm/layer22": 14.883748054504395, "max_norm/layer23": 15.04641342163086, "max_norm/layer3": 14.34477710723877, "max_norm/layer4": 14.549644470214844, "max_norm/layer5": 16.144901275634766, "max_norm/layer6": 14.10580062866211, "max_norm/layer7": 14.937480926513672, "max_norm/layer8": 15.275439262390137, "max_norm/layer9": 15.114044189453125, "mean_norm": 9.081460249920687, "mean_norm/layer0": 8.735827803611755, "mean_norm/layer1": 8.804422497749329, "mean_norm/layer10": 9.052965462207794, "mean_norm/layer11": 9.16351443529129, "mean_norm/layer12": 9.306387066841125, "mean_norm/layer13": 8.996783316135406, "mean_norm/layer14": 9.170424222946167, "mean_norm/layer15": 9.286848545074463, "mean_norm/layer16": 9.033456265926361, "mean_norm/layer17": 9.253972351551056, "mean_norm/layer18": 9.065014839172363, "mean_norm/layer19": 9.074174404144287, "mean_norm/layer2": 8.366111278533936, "mean_norm/layer20": 9.157218277454376, "mean_norm/layer21": 9.12339198589325, "mean_norm/layer22": 9.491381049156189, "mean_norm/layer23": 9.47799527645111, "mean_norm/layer3": 9.250598967075348, "mean_norm/layer4": 8.848586916923523, "mean_norm/layer5": 9.725355744361877, "mean_norm/layer6": 8.651413083076477, "mean_norm/layer7": 8.862074136734009, "mean_norm/layer8": 9.039798736572266, "mean_norm/layer9": 9.017329335212708, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 2600 }, { "epoch": 1.09, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4437805981106744, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.8798539638519287, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7931, "eval_samples_per_second": 20.436, "eval_steps_per_second": 0.678, "step": 2600 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.11, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8597, "max_norm": 16.280908584594727, "max_norm/layer0": 14.25904369354248, "max_norm/layer1": 14.876733779907227, "max_norm/layer10": 15.432615280151367, "max_norm/layer11": 15.070473670959473, "max_norm/layer12": 15.340192794799805, "max_norm/layer13": 14.053213119506836, "max_norm/layer14": 15.254984855651855, "max_norm/layer15": 15.967584609985352, "max_norm/layer16": 14.240683555603027, "max_norm/layer17": 15.71219253540039, "max_norm/layer18": 14.776082992553711, "max_norm/layer19": 14.346572875976562, "max_norm/layer2": 12.922161102294922, "max_norm/layer20": 15.224787712097168, "max_norm/layer21": 14.95941162109375, "max_norm/layer22": 15.001152038574219, "max_norm/layer23": 15.122055053710938, "max_norm/layer3": 14.454421997070312, "max_norm/layer4": 14.653867721557617, "max_norm/layer5": 16.280908584594727, "max_norm/layer6": 14.169611930847168, "max_norm/layer7": 15.036980628967285, "max_norm/layer8": 15.427152633666992, "max_norm/layer9": 15.218523025512695, "mean_norm": 9.097782894968987, "mean_norm/layer0": 8.747545421123505, "mean_norm/layer1": 8.816453874111176, "mean_norm/layer10": 9.067423224449158, "mean_norm/layer11": 9.180491149425507, "mean_norm/layer12": 9.326535284519196, "mean_norm/layer13": 9.011679291725159, "mean_norm/layer14": 9.18821370601654, "mean_norm/layer15": 9.306611061096191, "mean_norm/layer16": 9.050126194953918, "mean_norm/layer17": 9.274332463741302, "mean_norm/layer18": 9.083183467388153, "mean_norm/layer19": 9.092769265174866, "mean_norm/layer2": 8.370811522006989, "mean_norm/layer20": 9.176023662090302, "mean_norm/layer21": 9.141830861568451, "mean_norm/layer22": 9.516046524047852, "mean_norm/layer23": 9.501545190811157, "mean_norm/layer3": 9.268109500408173, "mean_norm/layer4": 8.859676361083984, "mean_norm/layer5": 9.749540209770203, "mean_norm/layer6": 8.65969580411911, "mean_norm/layer7": 8.873176157474518, "mean_norm/layer8": 9.053912878036499, "mean_norm/layer9": 9.03105640411377, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 2650 }, { "epoch": 1.11, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4426530057637004, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.882810115814209, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7841, "eval_samples_per_second": 20.451, "eval_steps_per_second": 0.679, "step": 2650 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.13, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8523, "max_norm": 16.419876098632812, "max_norm/layer0": 14.34637451171875, "max_norm/layer1": 14.984748840332031, "max_norm/layer10": 15.536199569702148, "max_norm/layer11": 15.177663803100586, "max_norm/layer12": 15.445916175842285, "max_norm/layer13": 14.101208686828613, "max_norm/layer14": 15.343002319335938, "max_norm/layer15": 16.075366973876953, "max_norm/layer16": 14.350403785705566, "max_norm/layer17": 15.8396577835083, "max_norm/layer18": 14.874992370605469, "max_norm/layer19": 14.431367874145508, "max_norm/layer2": 13.012994766235352, "max_norm/layer20": 15.345575332641602, "max_norm/layer21": 15.066669464111328, "max_norm/layer22": 15.1093111038208, "max_norm/layer23": 15.202255249023438, "max_norm/layer3": 14.54269790649414, "max_norm/layer4": 14.769430160522461, "max_norm/layer5": 16.419876098632812, "max_norm/layer6": 14.223309516906738, "max_norm/layer7": 15.136229515075684, "max_norm/layer8": 15.555449485778809, "max_norm/layer9": 15.360017776489258, "mean_norm": 9.113588072359562, "mean_norm/layer0": 8.759117603302002, "mean_norm/layer1": 8.828328490257263, "mean_norm/layer10": 9.081544935703278, "mean_norm/layer11": 9.196539223194122, "mean_norm/layer12": 9.34596437215805, "mean_norm/layer13": 9.026325702667236, "mean_norm/layer14": 9.20580768585205, "mean_norm/layer15": 9.325709998607635, "mean_norm/layer16": 9.066176950931549, "mean_norm/layer17": 9.293815612792969, "mean_norm/layer18": 9.100383222103119, "mean_norm/layer19": 9.110606670379639, "mean_norm/layer2": 8.375436842441559, "mean_norm/layer20": 9.194181025028229, "mean_norm/layer21": 9.159276247024536, "mean_norm/layer22": 9.539666295051575, "mean_norm/layer23": 9.524423122406006, "mean_norm/layer3": 9.285327970981598, "mean_norm/layer4": 8.870383977890015, "mean_norm/layer5": 9.77319449186325, "mean_norm/layer6": 8.667758345603943, "mean_norm/layer7": 8.884088516235352, "mean_norm/layer8": 9.067574143409729, "mean_norm/layer9": 9.044482290744781, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 2700 }, { "epoch": 1.13, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.443082951047079, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.877031087875366, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8014, "eval_samples_per_second": 20.421, "eval_steps_per_second": 0.678, "step": 2700 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.15, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8622, "max_norm": 16.557350158691406, "max_norm/layer0": 14.418149948120117, "max_norm/layer1": 15.097500801086426, "max_norm/layer10": 15.643484115600586, "max_norm/layer11": 15.281368255615234, "max_norm/layer12": 15.568787574768066, "max_norm/layer13": 14.152594566345215, "max_norm/layer14": 15.426847457885742, "max_norm/layer15": 16.16790199279785, "max_norm/layer16": 14.4529447555542, "max_norm/layer17": 15.965700149536133, "max_norm/layer18": 15.009598731994629, "max_norm/layer19": 14.541038513183594, "max_norm/layer2": 13.10386848449707, "max_norm/layer20": 15.445903778076172, "max_norm/layer21": 15.171789169311523, "max_norm/layer22": 15.222389221191406, "max_norm/layer23": 15.312973976135254, "max_norm/layer3": 14.611842155456543, "max_norm/layer4": 14.887364387512207, "max_norm/layer5": 16.557350158691406, "max_norm/layer6": 14.284734725952148, "max_norm/layer7": 15.256564140319824, "max_norm/layer8": 15.690933227539062, "max_norm/layer9": 15.485148429870605, "mean_norm": 9.129469233254591, "mean_norm/layer0": 8.77081549167633, "mean_norm/layer1": 8.84003496170044, "mean_norm/layer10": 9.095685243606567, "mean_norm/layer11": 9.2125763297081, "mean_norm/layer12": 9.365703403949738, "mean_norm/layer13": 9.041068434715271, "mean_norm/layer14": 9.223137736320496, "mean_norm/layer15": 9.344794929027557, "mean_norm/layer16": 9.082189679145813, "mean_norm/layer17": 9.313395082950592, "mean_norm/layer18": 9.11777526140213, "mean_norm/layer19": 9.128398835659027, "mean_norm/layer2": 8.379985272884369, "mean_norm/layer20": 9.213001072406769, "mean_norm/layer21": 9.177213549613953, "mean_norm/layer22": 9.56313019990921, "mean_norm/layer23": 9.547671377658844, "mean_norm/layer3": 9.302635192871094, "mean_norm/layer4": 8.881201982498169, "mean_norm/layer5": 9.797004163265228, "mean_norm/layer6": 8.67586863040924, "mean_norm/layer7": 8.894869089126587, "mean_norm/layer8": 9.081298410892487, "mean_norm/layer9": 9.057807266712189, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 2750 }, { "epoch": 1.15, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4445593669258507, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.8714001178741455, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7901, "eval_samples_per_second": 20.441, "eval_steps_per_second": 0.679, "step": 2750 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.17, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.864, "max_norm": 16.692607879638672, "max_norm/layer0": 14.486806869506836, "max_norm/layer1": 15.20768928527832, "max_norm/layer10": 15.750007629394531, "max_norm/layer11": 15.358442306518555, "max_norm/layer12": 15.6708984375, "max_norm/layer13": 14.241842269897461, "max_norm/layer14": 15.518338203430176, "max_norm/layer15": 16.292762756347656, "max_norm/layer16": 14.54626750946045, "max_norm/layer17": 16.069358825683594, "max_norm/layer18": 15.13725757598877, "max_norm/layer19": 14.667492866516113, "max_norm/layer2": 13.187070846557617, "max_norm/layer20": 15.576197624206543, "max_norm/layer21": 15.274862289428711, "max_norm/layer22": 15.325810432434082, "max_norm/layer23": 15.413392066955566, "max_norm/layer3": 14.685466766357422, "max_norm/layer4": 14.984869003295898, "max_norm/layer5": 16.692607879638672, "max_norm/layer6": 14.32935619354248, "max_norm/layer7": 15.362448692321777, "max_norm/layer8": 15.82071304321289, "max_norm/layer9": 15.565882682800293, "mean_norm": 9.145023641486963, "mean_norm/layer0": 8.78237795829773, "mean_norm/layer1": 8.851688504219055, "mean_norm/layer10": 9.109631359577179, "mean_norm/layer11": 9.228287041187286, "mean_norm/layer12": 9.385038435459137, "mean_norm/layer13": 9.055398046970367, "mean_norm/layer14": 9.239995121955872, "mean_norm/layer15": 9.363190233707428, "mean_norm/layer16": 9.097616195678711, "mean_norm/layer17": 9.332431018352509, "mean_norm/layer18": 9.135051906108856, "mean_norm/layer19": 9.145816683769226, "mean_norm/layer2": 8.38431704044342, "mean_norm/layer20": 9.23117482662201, "mean_norm/layer21": 9.19452828168869, "mean_norm/layer22": 9.586361765861511, "mean_norm/layer23": 9.570209264755249, "mean_norm/layer3": 9.319473028182983, "mean_norm/layer4": 8.891644835472107, "mean_norm/layer5": 9.820540606975555, "mean_norm/layer6": 8.68411499261856, "mean_norm/layer7": 8.905657947063446, "mean_norm/layer8": 9.094788134098053, "mean_norm/layer9": 9.071234166622162, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 2800 }, { "epoch": 1.17, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4445796473637459, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.873532295227051, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8068, "eval_samples_per_second": 20.412, "eval_steps_per_second": 0.678, "step": 2800 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.19, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8527, "max_norm": 16.828922271728516, "max_norm/layer0": 14.584033012390137, "max_norm/layer1": 15.336833000183105, "max_norm/layer10": 15.875840187072754, "max_norm/layer11": 15.442821502685547, "max_norm/layer12": 15.754557609558105, "max_norm/layer13": 14.32339096069336, "max_norm/layer14": 15.597060203552246, "max_norm/layer15": 16.412872314453125, "max_norm/layer16": 14.650659561157227, "max_norm/layer17": 16.20420265197754, "max_norm/layer18": 15.219154357910156, "max_norm/layer19": 14.83084774017334, "max_norm/layer2": 13.268367767333984, "max_norm/layer20": 15.677299499511719, "max_norm/layer21": 15.406458854675293, "max_norm/layer22": 15.44321060180664, "max_norm/layer23": 15.511178016662598, "max_norm/layer3": 14.764835357666016, "max_norm/layer4": 15.09919548034668, "max_norm/layer5": 16.828922271728516, "max_norm/layer6": 14.383938789367676, "max_norm/layer7": 15.485296249389648, "max_norm/layer8": 15.941476821899414, "max_norm/layer9": 15.665557861328125, "mean_norm": 9.160597927868366, "mean_norm/layer0": 8.794089376926422, "mean_norm/layer1": 8.863369762897491, "mean_norm/layer10": 9.12364000082016, "mean_norm/layer11": 9.244284212589264, "mean_norm/layer12": 9.404542028903961, "mean_norm/layer13": 9.069941818714142, "mean_norm/layer14": 9.256960809230804, "mean_norm/layer15": 9.381789445877075, "mean_norm/layer16": 9.113153159618378, "mean_norm/layer17": 9.35132884979248, "mean_norm/layer18": 9.151803016662598, "mean_norm/layer19": 9.163000464439392, "mean_norm/layer2": 8.388769388198853, "mean_norm/layer20": 9.248739957809448, "mean_norm/layer21": 9.21191132068634, "mean_norm/layer22": 9.609494626522064, "mean_norm/layer23": 9.593034207820892, "mean_norm/layer3": 9.33625191450119, "mean_norm/layer4": 8.902081072330475, "mean_norm/layer5": 9.844298720359802, "mean_norm/layer6": 8.692344605922699, "mean_norm/layer7": 8.916409969329834, "mean_norm/layer8": 9.108461380004883, "mean_norm/layer9": 9.084650158882141, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 2850 }, { "epoch": 1.19, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.44370758853425163, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.8756139278411865, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8326, "eval_samples_per_second": 20.368, "eval_steps_per_second": 0.676, "step": 2850 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.21, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8409, "max_norm": 16.954225540161133, "max_norm/layer0": 14.67629623413086, "max_norm/layer1": 15.439681053161621, "max_norm/layer10": 15.993009567260742, "max_norm/layer11": 15.52728271484375, "max_norm/layer12": 15.852997779846191, "max_norm/layer13": 14.400331497192383, "max_norm/layer14": 15.702228546142578, "max_norm/layer15": 16.554004669189453, "max_norm/layer16": 14.767534255981445, "max_norm/layer17": 16.32081413269043, "max_norm/layer18": 15.322539329528809, "max_norm/layer19": 14.932204246520996, "max_norm/layer2": 13.33304214477539, "max_norm/layer20": 15.784565925598145, "max_norm/layer21": 15.512778282165527, "max_norm/layer22": 15.573765754699707, "max_norm/layer23": 15.618204116821289, "max_norm/layer3": 14.863533973693848, "max_norm/layer4": 15.184027671813965, "max_norm/layer5": 16.954225540161133, "max_norm/layer6": 14.433019638061523, "max_norm/layer7": 15.593091011047363, "max_norm/layer8": 16.040678024291992, "max_norm/layer9": 15.799813270568848, "mean_norm": 9.175687476992607, "mean_norm/layer0": 8.805468738079071, "mean_norm/layer1": 8.874761521816254, "mean_norm/layer10": 9.137395858764648, "mean_norm/layer11": 9.259815275669098, "mean_norm/layer12": 9.423438429832458, "mean_norm/layer13": 9.08407998085022, "mean_norm/layer14": 9.273297250270844, "mean_norm/layer15": 9.399744391441345, "mean_norm/layer16": 9.12816721200943, "mean_norm/layer17": 9.369861721992493, "mean_norm/layer18": 9.168180584907532, "mean_norm/layer19": 9.179289519786835, "mean_norm/layer2": 8.39303857088089, "mean_norm/layer20": 9.265758633613586, "mean_norm/layer21": 9.228505730628967, "mean_norm/layer22": 9.631839513778687, "mean_norm/layer23": 9.615257382392883, "mean_norm/layer3": 9.35254430770874, "mean_norm/layer4": 8.912357032299042, "mean_norm/layer5": 9.867339313030243, "mean_norm/layer6": 8.700405836105347, "mean_norm/layer7": 8.926807165145874, "mean_norm/layer8": 9.121643006801605, "mean_norm/layer9": 9.09750247001648, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 2900 }, { "epoch": 1.21, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.44484329305638365, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.8662402629852295, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5382, "eval_samples_per_second": 20.887, "eval_steps_per_second": 0.693, "step": 2900 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.23, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8535, "max_norm": 17.074094772338867, "max_norm/layer0": 14.771538734436035, "max_norm/layer1": 15.542774200439453, "max_norm/layer10": 16.1263370513916, "max_norm/layer11": 15.602151870727539, "max_norm/layer12": 15.966864585876465, "max_norm/layer13": 14.503449440002441, "max_norm/layer14": 15.782112121582031, "max_norm/layer15": 16.67736053466797, "max_norm/layer16": 14.884428977966309, "max_norm/layer17": 16.445512771606445, "max_norm/layer18": 15.415112495422363, "max_norm/layer19": 15.022063255310059, "max_norm/layer2": 13.403141021728516, "max_norm/layer20": 15.920245170593262, "max_norm/layer21": 15.62589168548584, "max_norm/layer22": 15.720357894897461, "max_norm/layer23": 15.716158866882324, "max_norm/layer3": 14.941350936889648, "max_norm/layer4": 15.257119178771973, "max_norm/layer5": 17.074094772338867, "max_norm/layer6": 14.491571426391602, "max_norm/layer7": 15.718575477600098, "max_norm/layer8": 16.172351837158203, "max_norm/layer9": 15.940131187438965, "mean_norm": 9.190696770946184, "mean_norm/layer0": 8.816956281661987, "mean_norm/layer1": 8.88613373041153, "mean_norm/layer10": 9.150634229183197, "mean_norm/layer11": 9.275252103805542, "mean_norm/layer12": 9.442244589328766, "mean_norm/layer13": 9.098045706748962, "mean_norm/layer14": 9.289654433727264, "mean_norm/layer15": 9.417704820632935, "mean_norm/layer16": 9.143186032772064, "mean_norm/layer17": 9.388283371925354, "mean_norm/layer18": 9.184568285942078, "mean_norm/layer19": 9.19563889503479, "mean_norm/layer2": 8.397359848022461, "mean_norm/layer20": 9.282590985298157, "mean_norm/layer21": 9.245154798030853, "mean_norm/layer22": 9.65415096282959, "mean_norm/layer23": 9.63697373867035, "mean_norm/layer3": 9.368990659713745, "mean_norm/layer4": 8.922351777553558, "mean_norm/layer5": 9.89015644788742, "mean_norm/layer6": 8.708074033260345, "mean_norm/layer7": 8.937257945537567, "mean_norm/layer8": 9.134815633296967, "mean_norm/layer9": 9.110543191432953, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 2950 }, { "epoch": 1.23, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4459871097536738, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.8599984645843506, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7959, "eval_samples_per_second": 20.431, "eval_steps_per_second": 0.678, "step": 2950 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.25, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8447, "max_norm": 17.19088363647461, "max_norm/layer0": 14.864973068237305, "max_norm/layer1": 15.62208080291748, "max_norm/layer10": 16.26564598083496, "max_norm/layer11": 15.690491676330566, "max_norm/layer12": 16.09348487854004, "max_norm/layer13": 14.608466148376465, "max_norm/layer14": 15.872156143188477, "max_norm/layer15": 16.789859771728516, "max_norm/layer16": 14.985624313354492, "max_norm/layer17": 16.59108543395996, "max_norm/layer18": 15.49613094329834, "max_norm/layer19": 15.138503074645996, "max_norm/layer2": 13.480121612548828, "max_norm/layer20": 16.039661407470703, "max_norm/layer21": 15.726054191589355, "max_norm/layer22": 15.85644245147705, "max_norm/layer23": 15.822321891784668, "max_norm/layer3": 15.016472816467285, "max_norm/layer4": 15.327754020690918, "max_norm/layer5": 17.19088363647461, "max_norm/layer6": 14.556528091430664, "max_norm/layer7": 15.827574729919434, "max_norm/layer8": 16.28036880493164, "max_norm/layer9": 16.034198760986328, "mean_norm": 9.205305655797323, "mean_norm/layer0": 8.828269600868225, "mean_norm/layer1": 8.897296965122223, "mean_norm/layer10": 9.163637578487396, "mean_norm/layer11": 9.2901731133461, "mean_norm/layer12": 9.460385203361511, "mean_norm/layer13": 9.11164516210556, "mean_norm/layer14": 9.305707812309265, "mean_norm/layer15": 9.43520051240921, "mean_norm/layer16": 9.157863140106201, "mean_norm/layer17": 9.406088531017303, "mean_norm/layer18": 9.200478971004486, "mean_norm/layer19": 9.211331129074097, "mean_norm/layer2": 8.401508867740631, "mean_norm/layer20": 9.298927962779999, "mean_norm/layer21": 9.261110067367554, "mean_norm/layer22": 9.6760755777359, "mean_norm/layer23": 9.658278584480286, "mean_norm/layer3": 9.3849378824234, "mean_norm/layer4": 8.932135999202728, "mean_norm/layer5": 9.912546157836914, "mean_norm/layer6": 8.71561086177826, "mean_norm/layer7": 8.947454273700714, "mean_norm/layer8": 9.147588908672333, "mean_norm/layer9": 9.123082876205444, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 3000 }, { "epoch": 1.25, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4469808512105393, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.8544092178344727, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8166, "eval_samples_per_second": 20.395, "eval_steps_per_second": 0.677, "step": 3000 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.27, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8494, "max_norm": 17.332006454467773, "max_norm/layer0": 14.971895217895508, "max_norm/layer1": 15.706180572509766, "max_norm/layer10": 16.39055633544922, "max_norm/layer11": 15.820825576782227, "max_norm/layer12": 16.230440139770508, "max_norm/layer13": 14.713774681091309, "max_norm/layer14": 15.964306831359863, "max_norm/layer15": 16.913372039794922, "max_norm/layer16": 15.084409713745117, "max_norm/layer17": 16.690601348876953, "max_norm/layer18": 15.592001914978027, "max_norm/layer19": 15.248854637145996, "max_norm/layer2": 13.564947128295898, "max_norm/layer20": 16.140636444091797, "max_norm/layer21": 15.825383186340332, "max_norm/layer22": 15.98045825958252, "max_norm/layer23": 15.944609642028809, "max_norm/layer3": 15.109355926513672, "max_norm/layer4": 15.39990234375, "max_norm/layer5": 17.332006454467773, "max_norm/layer6": 14.59697437286377, "max_norm/layer7": 15.948881149291992, "max_norm/layer8": 16.376832962036133, "max_norm/layer9": 16.13812828063965, "mean_norm": 9.220104138056437, "mean_norm/layer0": 8.839670896530151, "mean_norm/layer1": 8.908665537834167, "mean_norm/layer10": 9.176793336868286, "mean_norm/layer11": 9.305428922176361, "mean_norm/layer12": 9.478922605514526, "mean_norm/layer13": 9.125423610210419, "mean_norm/layer14": 9.321944952011108, "mean_norm/layer15": 9.452899932861328, "mean_norm/layer16": 9.172569692134857, "mean_norm/layer17": 9.424022793769836, "mean_norm/layer18": 9.216603875160217, "mean_norm/layer19": 9.227488934993744, "mean_norm/layer2": 8.40572214126587, "mean_norm/layer20": 9.315212488174438, "mean_norm/layer21": 9.277587234973907, "mean_norm/layer22": 9.698153376579285, "mean_norm/layer23": 9.679868876934052, "mean_norm/layer3": 9.401076316833496, "mean_norm/layer4": 8.941973567008972, "mean_norm/layer5": 9.935079276561737, "mean_norm/layer6": 8.72326409816742, "mean_norm/layer7": 8.957727432250977, "mean_norm/layer8": 9.160670280456543, "mean_norm/layer9": 9.135729134082794, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 3050 }, { "epoch": 1.27, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.44626292370904874, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.8586294651031494, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8056, "eval_samples_per_second": 20.414, "eval_steps_per_second": 0.678, "step": 3050 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.29, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.851, "max_norm": 17.45079231262207, "max_norm/layer0": 15.07141399383545, "max_norm/layer1": 15.788281440734863, "max_norm/layer10": 16.522247314453125, "max_norm/layer11": 15.996971130371094, "max_norm/layer12": 16.32065200805664, "max_norm/layer13": 14.813121795654297, "max_norm/layer14": 16.042503356933594, "max_norm/layer15": 17.024852752685547, "max_norm/layer16": 15.163915634155273, "max_norm/layer17": 16.79519271850586, "max_norm/layer18": 15.687070846557617, "max_norm/layer19": 15.342894554138184, "max_norm/layer2": 13.622076034545898, "max_norm/layer20": 16.25835418701172, "max_norm/layer21": 15.937350273132324, "max_norm/layer22": 16.101654052734375, "max_norm/layer23": 16.047069549560547, "max_norm/layer3": 15.202547073364258, "max_norm/layer4": 15.467806816101074, "max_norm/layer5": 17.45079231262207, "max_norm/layer6": 14.651065826416016, "max_norm/layer7": 16.03363609313965, "max_norm/layer8": 16.475841522216797, "max_norm/layer9": 16.232484817504883, "mean_norm": 9.234526852766672, "mean_norm/layer0": 8.850844144821167, "mean_norm/layer1": 8.919748723506927, "mean_norm/layer10": 9.189667701721191, "mean_norm/layer11": 9.320032119750977, "mean_norm/layer12": 9.49708503484726, "mean_norm/layer13": 9.138881921768188, "mean_norm/layer14": 9.337770938873291, "mean_norm/layer15": 9.47018826007843, "mean_norm/layer16": 9.186775863170624, "mean_norm/layer17": 9.441416263580322, "mean_norm/layer18": 9.232204139232635, "mean_norm/layer19": 9.243465781211853, "mean_norm/layer2": 8.40979117155075, "mean_norm/layer20": 9.331261694431305, "mean_norm/layer21": 9.293141663074493, "mean_norm/layer22": 9.719446420669556, "mean_norm/layer23": 9.700763463973999, "mean_norm/layer3": 9.41711300611496, "mean_norm/layer4": 8.95202124118805, "mean_norm/layer5": 9.957186877727509, "mean_norm/layer6": 8.730644345283508, "mean_norm/layer7": 8.96764749288559, "mean_norm/layer8": 9.17331349849701, "mean_norm/layer9": 9.148232698440552, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 3100 }, { "epoch": 1.29, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.44737429170570653, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.8489952087402344, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5802, "eval_samples_per_second": 20.811, "eval_steps_per_second": 0.691, "step": 3100 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.32, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8352, "max_norm": 17.570619583129883, "max_norm/layer0": 15.160906791687012, "max_norm/layer1": 15.87808609008789, "max_norm/layer10": 16.663211822509766, "max_norm/layer11": 16.07549285888672, "max_norm/layer12": 16.4635066986084, "max_norm/layer13": 14.898290634155273, "max_norm/layer14": 16.140918731689453, "max_norm/layer15": 17.153202056884766, "max_norm/layer16": 15.241742134094238, "max_norm/layer17": 16.903993606567383, "max_norm/layer18": 15.782885551452637, "max_norm/layer19": 15.452775001525879, "max_norm/layer2": 13.689221382141113, "max_norm/layer20": 16.361042022705078, "max_norm/layer21": 16.02024269104004, "max_norm/layer22": 16.25684928894043, "max_norm/layer23": 16.14984703063965, "max_norm/layer3": 15.28460693359375, "max_norm/layer4": 15.529900550842285, "max_norm/layer5": 17.570619583129883, "max_norm/layer6": 14.70571231842041, "max_norm/layer7": 16.162504196166992, "max_norm/layer8": 16.585596084594727, "max_norm/layer9": 16.349956512451172, "mean_norm": 9.248786879082521, "mean_norm/layer0": 8.861954629421234, "mean_norm/layer1": 8.930564403533936, "mean_norm/layer10": 9.202419340610504, "mean_norm/layer11": 9.334671199321747, "mean_norm/layer12": 9.51488173007965, "mean_norm/layer13": 9.152113914489746, "mean_norm/layer14": 9.353131890296936, "mean_norm/layer15": 9.487328350543976, "mean_norm/layer16": 9.201062262058258, "mean_norm/layer17": 9.458812892436981, "mean_norm/layer18": 9.247539579868317, "mean_norm/layer19": 9.259144306182861, "mean_norm/layer2": 8.413836479187012, "mean_norm/layer20": 9.347349166870117, "mean_norm/layer21": 9.308494091033936, "mean_norm/layer22": 9.74064427614212, "mean_norm/layer23": 9.721216857433319, "mean_norm/layer3": 9.432927966117859, "mean_norm/layer4": 8.961803197860718, "mean_norm/layer5": 9.979026854038239, "mean_norm/layer6": 8.738053262233734, "mean_norm/layer7": 8.977501392364502, "mean_norm/layer8": 9.185922145843506, "mean_norm/layer9": 9.160484910011292, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 3150 }, { "epoch": 1.32, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.44814089225814563, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.843223810195923, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8154, "eval_samples_per_second": 20.397, "eval_steps_per_second": 0.677, "step": 3150 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.34, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8437, "max_norm": 17.70356559753418, "max_norm/layer0": 15.250068664550781, "max_norm/layer1": 15.979663848876953, "max_norm/layer10": 16.79854965209961, "max_norm/layer11": 16.147912979125977, "max_norm/layer12": 16.560741424560547, "max_norm/layer13": 14.95504379272461, "max_norm/layer14": 16.233966827392578, "max_norm/layer15": 17.285449981689453, "max_norm/layer16": 15.354681015014648, "max_norm/layer17": 17.01114273071289, "max_norm/layer18": 15.888689994812012, "max_norm/layer19": 15.555651664733887, "max_norm/layer2": 13.74233341217041, "max_norm/layer20": 16.473976135253906, "max_norm/layer21": 16.12687873840332, "max_norm/layer22": 16.351245880126953, "max_norm/layer23": 16.270776748657227, "max_norm/layer3": 15.34660530090332, "max_norm/layer4": 15.623671531677246, "max_norm/layer5": 17.70356559753418, "max_norm/layer6": 14.763014793395996, "max_norm/layer7": 16.251935958862305, "max_norm/layer8": 16.690643310546875, "max_norm/layer9": 16.44407844543457, "mean_norm": 9.263032605250677, "mean_norm/layer0": 8.873132646083832, "mean_norm/layer1": 8.94136381149292, "mean_norm/layer10": 9.215128123760223, "mean_norm/layer11": 9.349354445934296, "mean_norm/layer12": 9.532716155052185, "mean_norm/layer13": 9.165308952331543, "mean_norm/layer14": 9.368605971336365, "mean_norm/layer15": 9.50459748506546, "mean_norm/layer16": 9.215272843837738, "mean_norm/layer17": 9.476195633411407, "mean_norm/layer18": 9.262809813022614, "mean_norm/layer19": 9.27439969778061, "mean_norm/layer2": 8.417843043804169, "mean_norm/layer20": 9.363462388515472, "mean_norm/layer21": 9.324271738529205, "mean_norm/layer22": 9.761922836303711, "mean_norm/layer23": 9.74175089597702, "mean_norm/layer3": 9.448581278324127, "mean_norm/layer4": 8.971577763557434, "mean_norm/layer5": 10.000657439231873, "mean_norm/layer6": 8.745424628257751, "mean_norm/layer7": 8.987475097179413, "mean_norm/layer8": 9.198350310325623, "mean_norm/layer9": 9.172579526901245, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 3200 }, { "epoch": 1.34, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.447702834799609, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.8433425426483154, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.819, "eval_samples_per_second": 20.391, "eval_steps_per_second": 0.677, "step": 3200 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.36, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8519, "max_norm": 17.860597610473633, "max_norm/layer0": 15.346634864807129, "max_norm/layer1": 16.065568923950195, "max_norm/layer10": 16.915620803833008, "max_norm/layer11": 16.206560134887695, "max_norm/layer12": 16.65528106689453, "max_norm/layer13": 15.02581787109375, "max_norm/layer14": 16.34491539001465, "max_norm/layer15": 17.41537094116211, "max_norm/layer16": 15.447769165039062, "max_norm/layer17": 17.1556339263916, "max_norm/layer18": 15.984742164611816, "max_norm/layer19": 15.66572380065918, "max_norm/layer2": 13.785428047180176, "max_norm/layer20": 16.59414291381836, "max_norm/layer21": 16.224258422851562, "max_norm/layer22": 16.447364807128906, "max_norm/layer23": 16.371061325073242, "max_norm/layer3": 15.438834190368652, "max_norm/layer4": 15.713982582092285, "max_norm/layer5": 17.860597610473633, "max_norm/layer6": 14.833402633666992, "max_norm/layer7": 16.37326431274414, "max_norm/layer8": 16.806903839111328, "max_norm/layer9": 16.539751052856445, "mean_norm": 9.277176524202028, "mean_norm/layer0": 8.884214758872986, "mean_norm/layer1": 8.952378034591675, "mean_norm/layer10": 9.227916955947876, "mean_norm/layer11": 9.363875806331635, "mean_norm/layer12": 9.550445020198822, "mean_norm/layer13": 9.178218245506287, "mean_norm/layer14": 9.384025871753693, "mean_norm/layer15": 9.521648645401001, "mean_norm/layer16": 9.22939395904541, "mean_norm/layer17": 9.493267953395844, "mean_norm/layer18": 9.277807056903839, "mean_norm/layer19": 9.289763867855072, "mean_norm/layer2": 8.421853244304657, "mean_norm/layer20": 9.379169642925262, "mean_norm/layer21": 9.339562237262726, "mean_norm/layer22": 9.782929956912994, "mean_norm/layer23": 9.762168943881989, "mean_norm/layer3": 9.464285552501678, "mean_norm/layer4": 8.981122076511383, "mean_norm/layer5": 10.022289276123047, "mean_norm/layer6": 8.752665579319, "mean_norm/layer7": 8.997315227985382, "mean_norm/layer8": 9.211067497730255, "mean_norm/layer9": 9.184851169586182, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 3250 }, { "epoch": 1.36, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.44898455847458657, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.8393099308013916, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8059, "eval_samples_per_second": 20.413, "eval_steps_per_second": 0.678, "step": 3250 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.38, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8446, "max_norm": 18.016963958740234, "max_norm/layer0": 15.441362380981445, "max_norm/layer1": 16.141338348388672, "max_norm/layer10": 17.031034469604492, "max_norm/layer11": 16.273303985595703, "max_norm/layer12": 16.74533462524414, "max_norm/layer13": 15.093159675598145, "max_norm/layer14": 16.452301025390625, "max_norm/layer15": 17.527395248413086, "max_norm/layer16": 15.512605667114258, "max_norm/layer17": 17.280061721801758, "max_norm/layer18": 16.084121704101562, "max_norm/layer19": 15.759353637695312, "max_norm/layer2": 13.81966781616211, "max_norm/layer20": 16.718875885009766, "max_norm/layer21": 16.32035255432129, "max_norm/layer22": 16.567575454711914, "max_norm/layer23": 16.46967124938965, "max_norm/layer3": 15.51447582244873, "max_norm/layer4": 15.789702415466309, "max_norm/layer5": 18.016963958740234, "max_norm/layer6": 14.896657943725586, "max_norm/layer7": 16.477813720703125, "max_norm/layer8": 16.922813415527344, "max_norm/layer9": 16.6334171295166, "mean_norm": 9.290889439483484, "mean_norm/layer0": 8.895033597946167, "mean_norm/layer1": 8.963081002235413, "mean_norm/layer10": 9.240162551403046, "mean_norm/layer11": 9.377988994121552, "mean_norm/layer12": 9.567772030830383, "mean_norm/layer13": 9.190891683101654, "mean_norm/layer14": 9.399105072021484, "mean_norm/layer15": 9.538142681121826, "mean_norm/layer16": 9.24304586648941, "mean_norm/layer17": 9.510010719299316, "mean_norm/layer18": 9.292459189891815, "mean_norm/layer19": 9.304514169692993, "mean_norm/layer2": 8.425727248191833, "mean_norm/layer20": 9.394480288028717, "mean_norm/layer21": 9.354299426078796, "mean_norm/layer22": 9.803248167037964, "mean_norm/layer23": 9.781766414642334, "mean_norm/layer3": 9.47944289445877, "mean_norm/layer4": 8.990542650222778, "mean_norm/layer5": 10.04342132806778, "mean_norm/layer6": 8.759501457214355, "mean_norm/layer7": 9.006960988044739, "mean_norm/layer8": 9.223146975040436, "mean_norm/layer9": 9.196601152420044, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 3300 }, { "epoch": 1.38, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.44939016723249087, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.8373703956604004, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8356, "eval_samples_per_second": 20.362, "eval_steps_per_second": 0.676, "step": 3300 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.4, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8313, "max_norm": 18.179218292236328, "max_norm/layer0": 15.533577919006348, "max_norm/layer1": 16.243879318237305, "max_norm/layer10": 17.173385620117188, "max_norm/layer11": 16.345731735229492, "max_norm/layer12": 16.848569869995117, "max_norm/layer13": 15.166905403137207, "max_norm/layer14": 16.53302764892578, "max_norm/layer15": 17.655122756958008, "max_norm/layer16": 15.596038818359375, "max_norm/layer17": 17.404146194458008, "max_norm/layer18": 16.180326461791992, "max_norm/layer19": 15.84206485748291, "max_norm/layer2": 13.853592872619629, "max_norm/layer20": 16.853952407836914, "max_norm/layer21": 16.416898727416992, "max_norm/layer22": 16.667673110961914, "max_norm/layer23": 16.5629940032959, "max_norm/layer3": 15.585241317749023, "max_norm/layer4": 15.886917114257812, "max_norm/layer5": 18.179218292236328, "max_norm/layer6": 14.965940475463867, "max_norm/layer7": 16.574649810791016, "max_norm/layer8": 17.033422470092773, "max_norm/layer9": 16.74019432067871, "mean_norm": 9.304636073609194, "mean_norm/layer0": 8.90590125322342, "mean_norm/layer1": 8.973723888397217, "mean_norm/layer10": 9.252578437328339, "mean_norm/layer11": 9.392187356948853, "mean_norm/layer12": 9.584810256958008, "mean_norm/layer13": 9.203449964523315, "mean_norm/layer14": 9.413988173007965, "mean_norm/layer15": 9.554635107517242, "mean_norm/layer16": 9.25671535730362, "mean_norm/layer17": 9.526697039604187, "mean_norm/layer18": 9.306841850280762, "mean_norm/layer19": 9.31952553987503, "mean_norm/layer2": 8.429565906524658, "mean_norm/layer20": 9.409839034080505, "mean_norm/layer21": 9.369287729263306, "mean_norm/layer22": 9.82382595539093, "mean_norm/layer23": 9.801779389381409, "mean_norm/layer3": 9.494613111019135, "mean_norm/layer4": 8.999967634677887, "mean_norm/layer5": 10.064538836479187, "mean_norm/layer6": 8.766620993614197, "mean_norm/layer7": 9.016564190387726, "mean_norm/layer8": 9.235347211360931, "mean_norm/layer9": 9.208261549472809, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 3350 }, { "epoch": 1.4, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4490372876131141, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.8347883224487305, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 10.7963, "eval_samples_per_second": 22.322, "eval_steps_per_second": 0.741, "step": 3350 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.42, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8251, "max_norm": 18.336759567260742, "max_norm/layer0": 15.618881225585938, "max_norm/layer1": 16.339771270751953, "max_norm/layer10": 17.287466049194336, "max_norm/layer11": 16.401472091674805, "max_norm/layer12": 16.958864212036133, "max_norm/layer13": 15.245092391967773, "max_norm/layer14": 16.62425994873047, "max_norm/layer15": 17.777263641357422, "max_norm/layer16": 15.674489974975586, "max_norm/layer17": 17.523509979248047, "max_norm/layer18": 16.255813598632812, "max_norm/layer19": 15.934908866882324, "max_norm/layer2": 13.882692337036133, "max_norm/layer20": 16.969314575195312, "max_norm/layer21": 16.508270263671875, "max_norm/layer22": 16.763980865478516, "max_norm/layer23": 16.67099380493164, "max_norm/layer3": 15.66022777557373, "max_norm/layer4": 15.979378700256348, "max_norm/layer5": 18.336759567260742, "max_norm/layer6": 15.03795337677002, "max_norm/layer7": 16.673524856567383, "max_norm/layer8": 17.149028778076172, "max_norm/layer9": 16.84016227722168, "mean_norm": 9.318130704263845, "mean_norm/layer0": 8.916600942611694, "mean_norm/layer1": 8.984344899654388, "mean_norm/layer10": 9.264764606952667, "mean_norm/layer11": 9.40614765882492, "mean_norm/layer12": 9.601603388786316, "mean_norm/layer13": 9.216069042682648, "mean_norm/layer14": 9.428646862506866, "mean_norm/layer15": 9.570810496807098, "mean_norm/layer16": 9.27027541399002, "mean_norm/layer17": 9.542983949184418, "mean_norm/layer18": 9.321069478988647, "mean_norm/layer19": 9.3338503241539, "mean_norm/layer2": 8.43327808380127, "mean_norm/layer20": 9.42466515302658, "mean_norm/layer21": 9.383947730064392, "mean_norm/layer22": 9.844399809837341, "mean_norm/layer23": 9.821134805679321, "mean_norm/layer3": 9.50949090719223, "mean_norm/layer4": 9.009099662303925, "mean_norm/layer5": 10.085379660129547, "mean_norm/layer6": 8.773491621017456, "mean_norm/layer7": 9.025936245918274, "mean_norm/layer8": 9.247284710407257, "mean_norm/layer9": 9.219861447811127, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 3400 }, { "epoch": 1.42, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.44893588542363805, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.8318352699279785, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6041, "eval_samples_per_second": 20.769, "eval_steps_per_second": 0.689, "step": 3400 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.44, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8429, "max_norm": 18.477962493896484, "max_norm/layer0": 15.704484939575195, "max_norm/layer1": 16.429656982421875, "max_norm/layer10": 17.405029296875, "max_norm/layer11": 16.489473342895508, "max_norm/layer12": 17.07954978942871, "max_norm/layer13": 15.339924812316895, "max_norm/layer14": 16.736328125, "max_norm/layer15": 17.899723052978516, "max_norm/layer16": 15.776835441589355, "max_norm/layer17": 17.662168502807617, "max_norm/layer18": 16.360383987426758, "max_norm/layer19": 16.030488967895508, "max_norm/layer2": 13.910673141479492, "max_norm/layer20": 17.0791015625, "max_norm/layer21": 16.60880470275879, "max_norm/layer22": 16.860157012939453, "max_norm/layer23": 16.763296127319336, "max_norm/layer3": 15.720104217529297, "max_norm/layer4": 16.067779541015625, "max_norm/layer5": 18.477962493896484, "max_norm/layer6": 15.11044979095459, "max_norm/layer7": 16.761457443237305, "max_norm/layer8": 17.262792587280273, "max_norm/layer9": 16.94117546081543, "mean_norm": 9.331590088705221, "mean_norm/layer0": 8.927314579486847, "mean_norm/layer1": 8.99471640586853, "mean_norm/layer10": 9.277050256729126, "mean_norm/layer11": 9.420108437538147, "mean_norm/layer12": 9.61855810880661, "mean_norm/layer13": 9.22856056690216, "mean_norm/layer14": 9.443263828754425, "mean_norm/layer15": 9.586838006973267, "mean_norm/layer16": 9.283744394779205, "mean_norm/layer17": 9.559471309185028, "mean_norm/layer18": 9.335309386253357, "mean_norm/layer19": 9.348252415657043, "mean_norm/layer2": 8.4369957447052, "mean_norm/layer20": 9.439510464668274, "mean_norm/layer21": 9.398659586906433, "mean_norm/layer22": 9.864253401756287, "mean_norm/layer23": 9.840354681015015, "mean_norm/layer3": 9.524330019950867, "mean_norm/layer4": 9.01804405450821, "mean_norm/layer5": 10.106251001358032, "mean_norm/layer6": 8.780368089675903, "mean_norm/layer7": 9.035491406917572, "mean_norm/layer8": 9.259211540222168, "mean_norm/layer9": 9.231504440307617, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 3450 }, { "epoch": 1.44, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4497430468518676, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.828789472579956, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 10.7908, "eval_samples_per_second": 22.334, "eval_steps_per_second": 0.741, "step": 3450 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.46, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8397, "max_norm": 18.612791061401367, "max_norm/layer0": 15.785677909851074, "max_norm/layer1": 16.514942169189453, "max_norm/layer10": 17.51824951171875, "max_norm/layer11": 16.590362548828125, "max_norm/layer12": 17.19257354736328, "max_norm/layer13": 15.409317970275879, "max_norm/layer14": 16.837434768676758, "max_norm/layer15": 17.997446060180664, "max_norm/layer16": 15.877601623535156, "max_norm/layer17": 17.79769515991211, "max_norm/layer18": 16.465822219848633, "max_norm/layer19": 16.119728088378906, "max_norm/layer2": 13.954423904418945, "max_norm/layer20": 17.191173553466797, "max_norm/layer21": 16.693696975708008, "max_norm/layer22": 16.954496383666992, "max_norm/layer23": 16.847951889038086, "max_norm/layer3": 15.772260665893555, "max_norm/layer4": 16.147335052490234, "max_norm/layer5": 18.612791061401367, "max_norm/layer6": 15.16303825378418, "max_norm/layer7": 16.8575439453125, "max_norm/layer8": 17.3731689453125, "max_norm/layer9": 17.055498123168945, "mean_norm": 9.344837203621864, "mean_norm/layer0": 8.937843799591064, "mean_norm/layer1": 9.005088448524475, "mean_norm/layer10": 9.289023041725159, "mean_norm/layer11": 9.433656215667725, "mean_norm/layer12": 9.635209679603577, "mean_norm/layer13": 9.24088716506958, "mean_norm/layer14": 9.457638919353485, "mean_norm/layer15": 9.602668046951294, "mean_norm/layer16": 9.296828985214233, "mean_norm/layer17": 9.575341761112213, "mean_norm/layer18": 9.349262356758118, "mean_norm/layer19": 9.362391829490662, "mean_norm/layer2": 8.44077605009079, "mean_norm/layer20": 9.454284369945526, "mean_norm/layer21": 9.413063526153564, "mean_norm/layer22": 9.883745014667511, "mean_norm/layer23": 9.859206199645996, "mean_norm/layer3": 9.539020895957947, "mean_norm/layer4": 9.027145206928253, "mean_norm/layer5": 10.12680846452713, "mean_norm/layer6": 8.787212014198303, "mean_norm/layer7": 9.044856607913971, "mean_norm/layer8": 9.271096289157867, "mean_norm/layer9": 9.2430379986763, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 3500 }, { "epoch": 1.46, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4511099483660051, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.8216705322265625, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.563, "eval_samples_per_second": 20.842, "eval_steps_per_second": 0.692, "step": 3500 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.48, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.833, "max_norm": 18.753446578979492, "max_norm/layer0": 15.853753089904785, "max_norm/layer1": 16.583667755126953, "max_norm/layer10": 17.616392135620117, "max_norm/layer11": 16.686279296875, "max_norm/layer12": 17.2836856842041, "max_norm/layer13": 15.484760284423828, "max_norm/layer14": 16.939178466796875, "max_norm/layer15": 18.10690689086914, "max_norm/layer16": 15.978145599365234, "max_norm/layer17": 17.911317825317383, "max_norm/layer18": 16.60814666748047, "max_norm/layer19": 16.217397689819336, "max_norm/layer2": 13.995329856872559, "max_norm/layer20": 17.310771942138672, "max_norm/layer21": 16.784269332885742, "max_norm/layer22": 17.0494384765625, "max_norm/layer23": 16.949352264404297, "max_norm/layer3": 15.835954666137695, "max_norm/layer4": 16.24813461303711, "max_norm/layer5": 18.753446578979492, "max_norm/layer6": 15.2390718460083, "max_norm/layer7": 16.97339630126953, "max_norm/layer8": 17.472185134887695, "max_norm/layer9": 17.17030906677246, "mean_norm": 9.358108803629875, "mean_norm/layer0": 8.948367297649384, "mean_norm/layer1": 9.015483260154724, "mean_norm/layer10": 9.300959289073944, "mean_norm/layer11": 9.44746309518814, "mean_norm/layer12": 9.651969850063324, "mean_norm/layer13": 9.253294944763184, "mean_norm/layer14": 9.472301483154297, "mean_norm/layer15": 9.618704080581665, "mean_norm/layer16": 9.310149073600769, "mean_norm/layer17": 9.591234683990479, "mean_norm/layer18": 9.36311811208725, "mean_norm/layer19": 9.376516222953796, "mean_norm/layer2": 8.444473266601562, "mean_norm/layer20": 9.46895295381546, "mean_norm/layer21": 9.42733383178711, "mean_norm/layer22": 9.903033971786499, "mean_norm/layer23": 9.87805551290512, "mean_norm/layer3": 9.553642868995667, "mean_norm/layer4": 9.036168217658997, "mean_norm/layer5": 10.147434830665588, "mean_norm/layer6": 8.794258058071136, "mean_norm/layer7": 9.054118037223816, "mean_norm/layer8": 9.283077836036682, "mean_norm/layer9": 9.25450050830841, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 3550 }, { "epoch": 1.48, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4499134025301874, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.825397253036499, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8024, "eval_samples_per_second": 20.42, "eval_steps_per_second": 0.678, "step": 3550 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.5, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8209, "max_norm": 18.887266159057617, "max_norm/layer0": 15.928442001342773, "max_norm/layer1": 16.638465881347656, "max_norm/layer10": 17.713111877441406, "max_norm/layer11": 16.772506713867188, "max_norm/layer12": 17.393291473388672, "max_norm/layer13": 15.576926231384277, "max_norm/layer14": 17.04795265197754, "max_norm/layer15": 18.229637145996094, "max_norm/layer16": 16.101669311523438, "max_norm/layer17": 18.021533966064453, "max_norm/layer18": 16.741031646728516, "max_norm/layer19": 16.309358596801758, "max_norm/layer2": 14.079461097717285, "max_norm/layer20": 17.407546997070312, "max_norm/layer21": 16.90997314453125, "max_norm/layer22": 17.160221099853516, "max_norm/layer23": 17.035873413085938, "max_norm/layer3": 15.932682991027832, "max_norm/layer4": 16.348690032958984, "max_norm/layer5": 18.887266159057617, "max_norm/layer6": 15.295527458190918, "max_norm/layer7": 17.097925186157227, "max_norm/layer8": 17.554088592529297, "max_norm/layer9": 17.282934188842773, "mean_norm": 9.371505024532476, "mean_norm/layer0": 8.959096014499664, "mean_norm/layer1": 9.026121318340302, "mean_norm/layer10": 9.313242495059967, "mean_norm/layer11": 9.461414635181427, "mean_norm/layer12": 9.668856620788574, "mean_norm/layer13": 9.265742599964142, "mean_norm/layer14": 9.486914694309235, "mean_norm/layer15": 9.634682357311249, "mean_norm/layer16": 9.323372840881348, "mean_norm/layer17": 9.60727709531784, "mean_norm/layer18": 9.377022087574005, "mean_norm/layer19": 9.390734195709229, "mean_norm/layer2": 8.448146045207977, "mean_norm/layer20": 9.483981490135193, "mean_norm/layer21": 9.441752195358276, "mean_norm/layer22": 9.922874212265015, "mean_norm/layer23": 9.897243618965149, "mean_norm/layer3": 9.568353295326233, "mean_norm/layer4": 9.04521918296814, "mean_norm/layer5": 10.168164014816284, "mean_norm/layer6": 8.801159620285034, "mean_norm/layer7": 9.063514709472656, "mean_norm/layer8": 9.295092165470123, "mean_norm/layer9": 9.266143083572388, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 3600 }, { "epoch": 1.5, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.45093148051252724, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.8219504356384277, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7946, "eval_samples_per_second": 20.433, "eval_steps_per_second": 0.678, "step": 3600 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.52, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8336, "max_norm": 19.024261474609375, "max_norm/layer0": 16.005525588989258, "max_norm/layer1": 16.7034854888916, "max_norm/layer10": 17.81429100036621, "max_norm/layer11": 16.852542877197266, "max_norm/layer12": 17.491962432861328, "max_norm/layer13": 15.668417930603027, "max_norm/layer14": 17.154603958129883, "max_norm/layer15": 18.34808921813965, "max_norm/layer16": 16.209043502807617, "max_norm/layer17": 18.15737533569336, "max_norm/layer18": 16.833559036254883, "max_norm/layer19": 16.41221046447754, "max_norm/layer2": 14.156972885131836, "max_norm/layer20": 17.505290985107422, "max_norm/layer21": 17.016029357910156, "max_norm/layer22": 17.268396377563477, "max_norm/layer23": 17.125720977783203, "max_norm/layer3": 16.029821395874023, "max_norm/layer4": 16.439924240112305, "max_norm/layer5": 19.024261474609375, "max_norm/layer6": 15.357059478759766, "max_norm/layer7": 17.220069885253906, "max_norm/layer8": 17.65226173400879, "max_norm/layer9": 17.398624420166016, "mean_norm": 9.384601970513662, "mean_norm/layer0": 8.969634473323822, "mean_norm/layer1": 9.036478281021118, "mean_norm/layer10": 9.325130581855774, "mean_norm/layer11": 9.475057005882263, "mean_norm/layer12": 9.685044169425964, "mean_norm/layer13": 9.277792394161224, "mean_norm/layer14": 9.501095294952393, "mean_norm/layer15": 9.650285363197327, "mean_norm/layer16": 9.336541652679443, "mean_norm/layer17": 9.623004257678986, "mean_norm/layer18": 9.390738606452942, "mean_norm/layer19": 9.404767334461212, "mean_norm/layer2": 8.451732337474823, "mean_norm/layer20": 9.498468458652496, "mean_norm/layer21": 9.456099450588226, "mean_norm/layer22": 9.942264795303345, "mean_norm/layer23": 9.915738880634308, "mean_norm/layer3": 9.582852602005005, "mean_norm/layer4": 9.054056227207184, "mean_norm/layer5": 10.188653767108917, "mean_norm/layer6": 8.807803988456726, "mean_norm/layer7": 9.072685480117798, "mean_norm/layer8": 9.306782305240631, "mean_norm/layer9": 9.277739584445953, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 3650 }, { "epoch": 1.52, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.45114645315421653, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.8175899982452393, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5432, "eval_samples_per_second": 20.878, "eval_steps_per_second": 0.693, "step": 3650 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.54, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8139, "max_norm": 19.137977600097656, "max_norm/layer0": 16.0833740234375, "max_norm/layer1": 16.776784896850586, "max_norm/layer10": 17.91156578063965, "max_norm/layer11": 16.949214935302734, "max_norm/layer12": 17.602840423583984, "max_norm/layer13": 15.76510238647461, "max_norm/layer14": 17.248186111450195, "max_norm/layer15": 18.48503303527832, "max_norm/layer16": 16.319406509399414, "max_norm/layer17": 18.264812469482422, "max_norm/layer18": 16.932689666748047, "max_norm/layer19": 16.511192321777344, "max_norm/layer2": 14.22626781463623, "max_norm/layer20": 17.621082305908203, "max_norm/layer21": 17.110122680664062, "max_norm/layer22": 17.374183654785156, "max_norm/layer23": 17.20750617980957, "max_norm/layer3": 16.11916732788086, "max_norm/layer4": 16.518123626708984, "max_norm/layer5": 19.137977600097656, "max_norm/layer6": 15.443400382995605, "max_norm/layer7": 17.33040428161621, "max_norm/layer8": 17.752338409423828, "max_norm/layer9": 17.495275497436523, "mean_norm": 9.39769247919321, "mean_norm/layer0": 8.980181157588959, "mean_norm/layer1": 9.046735346317291, "mean_norm/layer10": 9.337104260921478, "mean_norm/layer11": 9.48857319355011, "mean_norm/layer12": 9.701455056667328, "mean_norm/layer13": 9.290168941020966, "mean_norm/layer14": 9.51529061794281, "mean_norm/layer15": 9.665862381458282, "mean_norm/layer16": 9.349638223648071, "mean_norm/layer17": 9.638719916343689, "mean_norm/layer18": 9.40440809726715, "mean_norm/layer19": 9.418926656246185, "mean_norm/layer2": 8.45537531375885, "mean_norm/layer20": 9.513044118881226, "mean_norm/layer21": 9.470202088356018, "mean_norm/layer22": 9.961255609989166, "mean_norm/layer23": 9.934356808662415, "mean_norm/layer3": 9.597356498241425, "mean_norm/layer4": 9.062905848026276, "mean_norm/layer5": 10.208882927894592, "mean_norm/layer6": 8.814568221569061, "mean_norm/layer7": 9.08190244436264, "mean_norm/layer8": 9.31855446100235, "mean_norm/layer9": 9.289151310920715, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 3700 }, { "epoch": 1.54, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.45146282798538184, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.8167974948883057, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5485, "eval_samples_per_second": 20.869, "eval_steps_per_second": 0.693, "step": 3700 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.57, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8155, "max_norm": 19.25054931640625, "max_norm/layer0": 16.164255142211914, "max_norm/layer1": 16.874256134033203, "max_norm/layer10": 18.021665573120117, "max_norm/layer11": 17.04458236694336, "max_norm/layer12": 17.710533142089844, "max_norm/layer13": 15.850334167480469, "max_norm/layer14": 17.3418025970459, "max_norm/layer15": 18.614669799804688, "max_norm/layer16": 16.4307804107666, "max_norm/layer17": 18.387475967407227, "max_norm/layer18": 17.02359390258789, "max_norm/layer19": 16.638124465942383, "max_norm/layer2": 14.282529830932617, "max_norm/layer20": 17.732723236083984, "max_norm/layer21": 17.204208374023438, "max_norm/layer22": 17.47235870361328, "max_norm/layer23": 17.30570411682129, "max_norm/layer3": 16.197643280029297, "max_norm/layer4": 16.596391677856445, "max_norm/layer5": 19.25054931640625, "max_norm/layer6": 15.518656730651855, "max_norm/layer7": 17.450822830200195, "max_norm/layer8": 17.837682723999023, "max_norm/layer9": 17.59002685546875, "mean_norm": 9.410545006394386, "mean_norm/layer0": 8.99051821231842, "mean_norm/layer1": 9.056912958621979, "mean_norm/layer10": 9.348880767822266, "mean_norm/layer11": 9.501977682113647, "mean_norm/layer12": 9.717777132987976, "mean_norm/layer13": 9.302150130271912, "mean_norm/layer14": 9.52913784980774, "mean_norm/layer15": 9.681376457214355, "mean_norm/layer16": 9.362551271915436, "mean_norm/layer17": 9.654209911823273, "mean_norm/layer18": 9.417977392673492, "mean_norm/layer19": 9.432604491710663, "mean_norm/layer2": 8.458954632282257, "mean_norm/layer20": 9.526868760585785, "mean_norm/layer21": 9.484004497528076, "mean_norm/layer22": 9.980139374732971, "mean_norm/layer23": 9.952777981758118, "mean_norm/layer3": 9.611551821231842, "mean_norm/layer4": 9.071687638759613, "mean_norm/layer5": 10.228794932365417, "mean_norm/layer6": 8.821084141731262, "mean_norm/layer7": 9.090995073318481, "mean_norm/layer8": 9.329946517944336, "mean_norm/layer9": 9.300200521945953, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 3750 }, { "epoch": 1.57, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4517873149917053, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.812666177749634, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7797, "eval_samples_per_second": 20.459, "eval_steps_per_second": 0.679, "step": 3750 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.59, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8196, "max_norm": 19.39119529724121, "max_norm/layer0": 16.249656677246094, "max_norm/layer1": 16.963245391845703, "max_norm/layer10": 18.125328063964844, "max_norm/layer11": 17.15520477294922, "max_norm/layer12": 17.828350067138672, "max_norm/layer13": 15.930174827575684, "max_norm/layer14": 17.422183990478516, "max_norm/layer15": 18.75629997253418, "max_norm/layer16": 16.539464950561523, "max_norm/layer17": 18.515911102294922, "max_norm/layer18": 17.11224365234375, "max_norm/layer19": 16.767332077026367, "max_norm/layer2": 14.359777450561523, "max_norm/layer20": 17.840478897094727, "max_norm/layer21": 17.309904098510742, "max_norm/layer22": 17.559303283691406, "max_norm/layer23": 17.389223098754883, "max_norm/layer3": 16.30811309814453, "max_norm/layer4": 16.692081451416016, "max_norm/layer5": 19.39119529724121, "max_norm/layer6": 15.620407104492188, "max_norm/layer7": 17.557313919067383, "max_norm/layer8": 17.944181442260742, "max_norm/layer9": 17.681028366088867, "mean_norm": 9.423318974673748, "mean_norm/layer0": 9.000839114189148, "mean_norm/layer1": 9.066909670829773, "mean_norm/layer10": 9.36047077178955, "mean_norm/layer11": 9.515274345874786, "mean_norm/layer12": 9.733893871307373, "mean_norm/layer13": 9.31408303976059, "mean_norm/layer14": 9.542948007583618, "mean_norm/layer15": 9.696711778640747, "mean_norm/layer16": 9.375279724597931, "mean_norm/layer17": 9.66939002275467, "mean_norm/layer18": 9.431337356567383, "mean_norm/layer19": 9.446298122406006, "mean_norm/layer2": 8.462641179561615, "mean_norm/layer20": 9.540704071521759, "mean_norm/layer21": 9.49764209985733, "mean_norm/layer22": 9.998992681503296, "mean_norm/layer23": 9.971072018146515, "mean_norm/layer3": 9.62577337026596, "mean_norm/layer4": 9.08018147945404, "mean_norm/layer5": 10.248691976070404, "mean_norm/layer6": 8.82778912782669, "mean_norm/layer7": 9.100020945072174, "mean_norm/layer8": 9.34142941236496, "mean_norm/layer9": 9.311281204223633, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 3800 }, { "epoch": 1.59, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4525701398944606, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.8062896728515625, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.533, "eval_samples_per_second": 20.896, "eval_steps_per_second": 0.694, "step": 3800 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.61, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8083, "max_norm": 19.52190589904785, "max_norm/layer0": 16.348299026489258, "max_norm/layer1": 17.05620574951172, "max_norm/layer10": 18.23882293701172, "max_norm/layer11": 17.240055084228516, "max_norm/layer12": 17.929933547973633, "max_norm/layer13": 16.006711959838867, "max_norm/layer14": 17.513385772705078, "max_norm/layer15": 18.893762588500977, "max_norm/layer16": 16.633769989013672, "max_norm/layer17": 18.641620635986328, "max_norm/layer18": 17.20274543762207, "max_norm/layer19": 16.888694763183594, "max_norm/layer2": 14.43471908569336, "max_norm/layer20": 17.956628799438477, "max_norm/layer21": 17.431379318237305, "max_norm/layer22": 17.653854370117188, "max_norm/layer23": 17.478567123413086, "max_norm/layer3": 16.408828735351562, "max_norm/layer4": 16.770822525024414, "max_norm/layer5": 19.52190589904785, "max_norm/layer6": 15.692330360412598, "max_norm/layer7": 17.65044403076172, "max_norm/layer8": 18.09210777282715, "max_norm/layer9": 17.78131103515625, "mean_norm": 9.436038424571356, "mean_norm/layer0": 9.01114821434021, "mean_norm/layer1": 9.077042877674103, "mean_norm/layer10": 9.372229039669037, "mean_norm/layer11": 9.528716921806335, "mean_norm/layer12": 9.750010967254639, "mean_norm/layer13": 9.325950026512146, "mean_norm/layer14": 9.556561589241028, "mean_norm/layer15": 9.711856067180634, "mean_norm/layer16": 9.387940168380737, "mean_norm/layer17": 9.684573650360107, "mean_norm/layer18": 9.444583415985107, "mean_norm/layer19": 9.459890902042389, "mean_norm/layer2": 8.466160774230957, "mean_norm/layer20": 9.554618656635284, "mean_norm/layer21": 9.511114656925201, "mean_norm/layer22": 10.017443120479584, "mean_norm/layer23": 9.9893519282341, "mean_norm/layer3": 9.639805853366852, "mean_norm/layer4": 9.088814616203308, "mean_norm/layer5": 10.268649756908417, "mean_norm/layer6": 8.834497690200806, "mean_norm/layer7": 9.108858048915863, "mean_norm/layer8": 9.352881073951721, "mean_norm/layer9": 9.322222173213959, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 3850 }, { "epoch": 1.61, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4524444011795103, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.804806709289551, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7887, "eval_samples_per_second": 20.443, "eval_steps_per_second": 0.679, "step": 3850 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.63, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8202, "max_norm": 19.663883209228516, "max_norm/layer0": 16.442665100097656, "max_norm/layer1": 17.14680290222168, "max_norm/layer10": 18.334035873413086, "max_norm/layer11": 17.328901290893555, "max_norm/layer12": 18.035051345825195, "max_norm/layer13": 16.093976974487305, "max_norm/layer14": 17.588014602661133, "max_norm/layer15": 19.004194259643555, "max_norm/layer16": 16.748910903930664, "max_norm/layer17": 18.775148391723633, "max_norm/layer18": 17.282062530517578, "max_norm/layer19": 16.9793758392334, "max_norm/layer2": 14.499808311462402, "max_norm/layer20": 18.059389114379883, "max_norm/layer21": 17.545143127441406, "max_norm/layer22": 17.755186080932617, "max_norm/layer23": 17.595932006835938, "max_norm/layer3": 16.477340698242188, "max_norm/layer4": 16.84396743774414, "max_norm/layer5": 19.663883209228516, "max_norm/layer6": 15.78128433227539, "max_norm/layer7": 17.734956741333008, "max_norm/layer8": 18.204540252685547, "max_norm/layer9": 17.8907527923584, "mean_norm": 9.44852451235056, "mean_norm/layer0": 9.02129864692688, "mean_norm/layer1": 9.086955904960632, "mean_norm/layer10": 9.383722841739655, "mean_norm/layer11": 9.54167753458023, "mean_norm/layer12": 9.765829026699066, "mean_norm/layer13": 9.337481915950775, "mean_norm/layer14": 9.57017594575882, "mean_norm/layer15": 9.726840198040009, "mean_norm/layer16": 9.400262773036957, "mean_norm/layer17": 9.699501633644104, "mean_norm/layer18": 9.457594335079193, "mean_norm/layer19": 9.473425507545471, "mean_norm/layer2": 8.469590187072754, "mean_norm/layer20": 9.56819599866867, "mean_norm/layer21": 9.52423882484436, "mean_norm/layer22": 10.035979628562927, "mean_norm/layer23": 10.007273077964783, "mean_norm/layer3": 9.65359890460968, "mean_norm/layer4": 9.097174227237701, "mean_norm/layer5": 10.288195967674255, "mean_norm/layer6": 8.840922951698303, "mean_norm/layer7": 9.11753261089325, "mean_norm/layer8": 9.364024937152863, "mean_norm/layer9": 9.333094716072083, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 3900 }, { "epoch": 1.63, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.45347870351216624, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.798917770385742, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5468, "eval_samples_per_second": 20.872, "eval_steps_per_second": 0.693, "step": 3900 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.65, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8285, "max_norm": 19.807249069213867, "max_norm/layer0": 16.5258731842041, "max_norm/layer1": 17.226022720336914, "max_norm/layer10": 18.431427001953125, "max_norm/layer11": 17.429719924926758, "max_norm/layer12": 18.14910888671875, "max_norm/layer13": 16.1771297454834, "max_norm/layer14": 17.663759231567383, "max_norm/layer15": 19.13890266418457, "max_norm/layer16": 16.864423751831055, "max_norm/layer17": 18.906938552856445, "max_norm/layer18": 17.375585556030273, "max_norm/layer19": 17.078645706176758, "max_norm/layer2": 14.565903663635254, "max_norm/layer20": 18.17165756225586, "max_norm/layer21": 17.667926788330078, "max_norm/layer22": 17.864042282104492, "max_norm/layer23": 17.719139099121094, "max_norm/layer3": 16.543764114379883, "max_norm/layer4": 16.923555374145508, "max_norm/layer5": 19.807249069213867, "max_norm/layer6": 15.881307601928711, "max_norm/layer7": 17.841663360595703, "max_norm/layer8": 18.302600860595703, "max_norm/layer9": 17.986249923706055, "mean_norm": 9.460952490568161, "mean_norm/layer0": 9.031491935253143, "mean_norm/layer1": 9.096881031990051, "mean_norm/layer10": 9.395167052745819, "mean_norm/layer11": 9.554674923419952, "mean_norm/layer12": 9.78170108795166, "mean_norm/layer13": 9.348976492881775, "mean_norm/layer14": 9.58379751443863, "mean_norm/layer15": 9.741581797599792, "mean_norm/layer16": 9.412635207176208, "mean_norm/layer17": 9.714325428009033, "mean_norm/layer18": 9.470487415790558, "mean_norm/layer19": 9.48645406961441, "mean_norm/layer2": 8.473007798194885, "mean_norm/layer20": 9.581475257873535, "mean_norm/layer21": 9.537485659122467, "mean_norm/layer22": 10.05451250076294, "mean_norm/layer23": 10.025010108947754, "mean_norm/layer3": 9.667511641979218, "mean_norm/layer4": 9.105651140213013, "mean_norm/layer5": 10.307395875453949, "mean_norm/layer6": 8.847305834293365, "mean_norm/layer7": 9.126248717308044, "mean_norm/layer8": 9.375205636024475, "mean_norm/layer9": 9.343875646591187, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 3950 }, { "epoch": 1.65, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4531826091188961, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.800121307373047, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8098, "eval_samples_per_second": 20.407, "eval_steps_per_second": 0.677, "step": 3950 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.67, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8144, "max_norm": 19.9642276763916, "max_norm/layer0": 16.61147117614746, "max_norm/layer1": 17.310283660888672, "max_norm/layer10": 18.5467472076416, "max_norm/layer11": 17.51737403869629, "max_norm/layer12": 18.284799575805664, "max_norm/layer13": 16.269195556640625, "max_norm/layer14": 17.733585357666016, "max_norm/layer15": 19.260528564453125, "max_norm/layer16": 16.976835250854492, "max_norm/layer17": 19.035781860351562, "max_norm/layer18": 17.47535514831543, "max_norm/layer19": 17.174304962158203, "max_norm/layer2": 14.622349739074707, "max_norm/layer20": 18.276771545410156, "max_norm/layer21": 17.77849769592285, "max_norm/layer22": 17.960010528564453, "max_norm/layer23": 17.830236434936523, "max_norm/layer3": 16.622806549072266, "max_norm/layer4": 16.99311637878418, "max_norm/layer5": 19.9642276763916, "max_norm/layer6": 15.971922874450684, "max_norm/layer7": 17.943126678466797, "max_norm/layer8": 18.38897132873535, "max_norm/layer9": 18.076162338256836, "mean_norm": 9.473361556728682, "mean_norm/layer0": 9.041697025299072, "mean_norm/layer1": 9.106783270835876, "mean_norm/layer10": 9.40651547908783, "mean_norm/layer11": 9.567744493484497, "mean_norm/layer12": 9.79739373922348, "mean_norm/layer13": 9.360623478889465, "mean_norm/layer14": 9.59718006849289, "mean_norm/layer15": 9.75637936592102, "mean_norm/layer16": 9.424761176109314, "mean_norm/layer17": 9.729040384292603, "mean_norm/layer18": 9.483455121517181, "mean_norm/layer19": 9.499560296535492, "mean_norm/layer2": 8.476477980613708, "mean_norm/layer20": 9.594904780387878, "mean_norm/layer21": 9.55079185962677, "mean_norm/layer22": 10.07281231880188, "mean_norm/layer23": 10.042850077152252, "mean_norm/layer3": 9.681340396404266, "mean_norm/layer4": 9.11408942937851, "mean_norm/layer5": 10.326896071434021, "mean_norm/layer6": 8.85367339849472, "mean_norm/layer7": 9.134850978851318, "mean_norm/layer8": 9.386187195777893, "mean_norm/layer9": 9.354668974876404, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 4000 }, { "epoch": 1.67, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.45394920967133523, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.8009955883026123, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8157, "eval_samples_per_second": 20.397, "eval_steps_per_second": 0.677, "step": 4000 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.69, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.818, "max_norm": 20.119094848632812, "max_norm/layer0": 16.698545455932617, "max_norm/layer1": 17.391803741455078, "max_norm/layer10": 18.6510066986084, "max_norm/layer11": 17.621688842773438, "max_norm/layer12": 18.390403747558594, "max_norm/layer13": 16.343536376953125, "max_norm/layer14": 17.814393997192383, "max_norm/layer15": 19.369619369506836, "max_norm/layer16": 17.107633590698242, "max_norm/layer17": 19.145732879638672, "max_norm/layer18": 17.571773529052734, "max_norm/layer19": 17.277477264404297, "max_norm/layer2": 14.673759460449219, "max_norm/layer20": 18.38888931274414, "max_norm/layer21": 17.876964569091797, "max_norm/layer22": 18.05607795715332, "max_norm/layer23": 17.937580108642578, "max_norm/layer3": 16.682743072509766, "max_norm/layer4": 17.070730209350586, "max_norm/layer5": 20.119094848632812, "max_norm/layer6": 16.04961585998535, "max_norm/layer7": 18.03361701965332, "max_norm/layer8": 18.491865158081055, "max_norm/layer9": 18.16168975830078, "mean_norm": 9.485714507599672, "mean_norm/layer0": 9.051836490631104, "mean_norm/layer1": 9.116701900959015, "mean_norm/layer10": 9.41792494058609, "mean_norm/layer11": 9.58076012134552, "mean_norm/layer12": 9.813140749931335, "mean_norm/layer13": 9.37224268913269, "mean_norm/layer14": 9.61046987771988, "mean_norm/layer15": 9.771362841129303, "mean_norm/layer16": 9.43696254491806, "mean_norm/layer17": 9.743814766407013, "mean_norm/layer18": 9.496419370174408, "mean_norm/layer19": 9.512612521648407, "mean_norm/layer2": 8.479991137981415, "mean_norm/layer20": 9.608174979686737, "mean_norm/layer21": 9.563690483570099, "mean_norm/layer22": 10.09063470363617, "mean_norm/layer23": 10.060266733169556, "mean_norm/layer3": 9.69506311416626, "mean_norm/layer4": 9.122413873672485, "mean_norm/layer5": 10.346292912960052, "mean_norm/layer6": 8.86014074087143, "mean_norm/layer7": 9.143555641174316, "mean_norm/layer8": 9.397226512432098, "mean_norm/layer9": 9.365448534488678, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 4050 }, { "epoch": 1.69, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4548821098145151, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7933807373046875, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5572, "eval_samples_per_second": 20.853, "eval_steps_per_second": 0.692, "step": 4050 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.71, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8114, "max_norm": 20.25312042236328, "max_norm/layer0": 16.780771255493164, "max_norm/layer1": 17.454378128051758, "max_norm/layer10": 18.746997833251953, "max_norm/layer11": 17.710874557495117, "max_norm/layer12": 18.502702713012695, "max_norm/layer13": 16.42099380493164, "max_norm/layer14": 17.885833740234375, "max_norm/layer15": 19.495311737060547, "max_norm/layer16": 17.204898834228516, "max_norm/layer17": 19.27667236328125, "max_norm/layer18": 17.681575775146484, "max_norm/layer19": 17.363557815551758, "max_norm/layer2": 14.722838401794434, "max_norm/layer20": 18.501394271850586, "max_norm/layer21": 17.964780807495117, "max_norm/layer22": 18.162660598754883, "max_norm/layer23": 18.065580368041992, "max_norm/layer3": 16.761926651000977, "max_norm/layer4": 17.149524688720703, "max_norm/layer5": 20.25312042236328, "max_norm/layer6": 16.114870071411133, "max_norm/layer7": 18.13249397277832, "max_norm/layer8": 18.5709285736084, "max_norm/layer9": 18.23674201965332, "mean_norm": 9.497905241946379, "mean_norm/layer0": 9.06176507472992, "mean_norm/layer1": 9.126475751399994, "mean_norm/layer10": 9.429007589817047, "mean_norm/layer11": 9.593652665615082, "mean_norm/layer12": 9.828673005104065, "mean_norm/layer13": 9.383624970912933, "mean_norm/layer14": 9.623692214488983, "mean_norm/layer15": 9.786072611808777, "mean_norm/layer16": 9.44901967048645, "mean_norm/layer17": 9.758347272872925, "mean_norm/layer18": 9.50903469324112, "mean_norm/layer19": 9.525338292121887, "mean_norm/layer2": 8.483352661132812, "mean_norm/layer20": 9.621620059013367, "mean_norm/layer21": 9.576579630374908, "mean_norm/layer22": 10.108359515666962, "mean_norm/layer23": 10.077474415302277, "mean_norm/layer3": 9.708677530288696, "mean_norm/layer4": 9.130702793598175, "mean_norm/layer5": 10.365319192409515, "mean_norm/layer6": 8.866493701934814, "mean_norm/layer7": 9.152141213417053, "mean_norm/layer8": 9.4082390666008, "mean_norm/layer9": 9.376062214374542, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 4100 }, { "epoch": 1.71, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.45488616590209413, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.791409730911255, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8171, "eval_samples_per_second": 20.394, "eval_steps_per_second": 0.677, "step": 4100 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.73, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8119, "max_norm": 20.371471405029297, "max_norm/layer0": 16.874263763427734, "max_norm/layer1": 17.524900436401367, "max_norm/layer10": 18.839059829711914, "max_norm/layer11": 17.782032012939453, "max_norm/layer12": 18.594261169433594, "max_norm/layer13": 16.51697540283203, "max_norm/layer14": 17.984203338623047, "max_norm/layer15": 19.61891746520996, "max_norm/layer16": 17.298097610473633, "max_norm/layer17": 19.423992156982422, "max_norm/layer18": 17.77617073059082, "max_norm/layer19": 17.44768524169922, "max_norm/layer2": 14.78378677368164, "max_norm/layer20": 18.631628036499023, "max_norm/layer21": 18.048566818237305, "max_norm/layer22": 18.257789611816406, "max_norm/layer23": 18.17466926574707, "max_norm/layer3": 16.853816986083984, "max_norm/layer4": 17.234498977661133, "max_norm/layer5": 20.371471405029297, "max_norm/layer6": 16.19548797607422, "max_norm/layer7": 18.227479934692383, "max_norm/layer8": 18.656274795532227, "max_norm/layer9": 18.30875587463379, "mean_norm": 9.51002257068952, "mean_norm/layer0": 9.071641266345978, "mean_norm/layer1": 9.136261284351349, "mean_norm/layer10": 9.440190315246582, "mean_norm/layer11": 9.606357514858246, "mean_norm/layer12": 9.84403681755066, "mean_norm/layer13": 9.395072102546692, "mean_norm/layer14": 9.63693481683731, "mean_norm/layer15": 9.800684869289398, "mean_norm/layer16": 9.46108591556549, "mean_norm/layer17": 9.77271944284439, "mean_norm/layer18": 9.52157312631607, "mean_norm/layer19": 9.537791013717651, "mean_norm/layer2": 8.486609101295471, "mean_norm/layer20": 9.634786188602448, "mean_norm/layer21": 9.589442670345306, "mean_norm/layer22": 10.12604534626007, "mean_norm/layer23": 10.094537377357483, "mean_norm/layer3": 9.722192883491516, "mean_norm/layer4": 9.13902497291565, "mean_norm/layer5": 10.384238183498383, "mean_norm/layer6": 8.872731864452362, "mean_norm/layer7": 9.16065239906311, "mean_norm/layer8": 9.419233560562134, "mean_norm/layer9": 9.38669866323471, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 4150 }, { "epoch": 1.73, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4547360906616696, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7870960235595703, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.795, "eval_samples_per_second": 20.432, "eval_steps_per_second": 0.678, "step": 4150 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.75, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8018, "max_norm": 20.499284744262695, "max_norm/layer0": 16.95836067199707, "max_norm/layer1": 17.592952728271484, "max_norm/layer10": 18.959768295288086, "max_norm/layer11": 17.883838653564453, "max_norm/layer12": 18.69440460205078, "max_norm/layer13": 16.596149444580078, "max_norm/layer14": 18.067346572875977, "max_norm/layer15": 19.74480438232422, "max_norm/layer16": 17.383577346801758, "max_norm/layer17": 19.56295394897461, "max_norm/layer18": 17.864219665527344, "max_norm/layer19": 17.51543617248535, "max_norm/layer2": 14.8399658203125, "max_norm/layer20": 18.730480194091797, "max_norm/layer21": 18.160423278808594, "max_norm/layer22": 18.353191375732422, "max_norm/layer23": 18.279525756835938, "max_norm/layer3": 16.928646087646484, "max_norm/layer4": 17.300979614257812, "max_norm/layer5": 20.499284744262695, "max_norm/layer6": 16.267253875732422, "max_norm/layer7": 18.32831573486328, "max_norm/layer8": 18.737327575683594, "max_norm/layer9": 18.41295623779297, "mean_norm": 9.522137492895126, "mean_norm/layer0": 9.081620931625366, "mean_norm/layer1": 9.14617645740509, "mean_norm/layer10": 9.451456010341644, "mean_norm/layer11": 9.61904102563858, "mean_norm/layer12": 9.859608888626099, "mean_norm/layer13": 9.406528949737549, "mean_norm/layer14": 9.650117576122284, "mean_norm/layer15": 9.815293192863464, "mean_norm/layer16": 9.473051249980927, "mean_norm/layer17": 9.78711074590683, "mean_norm/layer18": 9.534133493900299, "mean_norm/layer19": 9.550578236579895, "mean_norm/layer2": 8.48985767364502, "mean_norm/layer20": 9.64762568473816, "mean_norm/layer21": 9.602255702018738, "mean_norm/layer22": 10.143462002277374, "mean_norm/layer23": 10.111734688282013, "mean_norm/layer3": 9.735645592212677, "mean_norm/layer4": 9.147038757801056, "mean_norm/layer5": 10.40328711271286, "mean_norm/layer6": 8.878861129283905, "mean_norm/layer7": 9.169294118881226, "mean_norm/layer8": 9.430241107940674, "mean_norm/layer9": 9.397279500961304, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 4200 }, { "epoch": 1.75, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.45517820420778526, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.786865711212158, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5849, "eval_samples_per_second": 20.803, "eval_steps_per_second": 0.691, "step": 4200 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.77, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8143, "max_norm": 20.623327255249023, "max_norm/layer0": 17.0467529296875, "max_norm/layer1": 17.657014846801758, "max_norm/layer10": 19.062538146972656, "max_norm/layer11": 17.97028923034668, "max_norm/layer12": 18.820533752441406, "max_norm/layer13": 16.673133850097656, "max_norm/layer14": 18.132125854492188, "max_norm/layer15": 19.867862701416016, "max_norm/layer16": 17.479171752929688, "max_norm/layer17": 19.690410614013672, "max_norm/layer18": 17.983844757080078, "max_norm/layer19": 17.591114044189453, "max_norm/layer2": 14.908049583435059, "max_norm/layer20": 18.829238891601562, "max_norm/layer21": 18.25043487548828, "max_norm/layer22": 18.438114166259766, "max_norm/layer23": 18.365001678466797, "max_norm/layer3": 17.014738082885742, "max_norm/layer4": 17.379840850830078, "max_norm/layer5": 20.623327255249023, "max_norm/layer6": 16.337890625, "max_norm/layer7": 18.422710418701172, "max_norm/layer8": 18.845876693725586, "max_norm/layer9": 18.491403579711914, "mean_norm": 9.534027844667435, "mean_norm/layer0": 9.091397941112518, "mean_norm/layer1": 9.155806422233582, "mean_norm/layer10": 9.462554395198822, "mean_norm/layer11": 9.631404340267181, "mean_norm/layer12": 9.874627470970154, "mean_norm/layer13": 9.417701601982117, "mean_norm/layer14": 9.662891149520874, "mean_norm/layer15": 9.829482555389404, "mean_norm/layer16": 9.484811902046204, "mean_norm/layer17": 9.801213920116425, "mean_norm/layer18": 9.546473264694214, "mean_norm/layer19": 9.563193321228027, "mean_norm/layer2": 8.493122577667236, "mean_norm/layer20": 9.660223424434662, "mean_norm/layer21": 9.61464524269104, "mean_norm/layer22": 10.160698652267456, "mean_norm/layer23": 10.12846302986145, "mean_norm/layer3": 9.748984336853027, "mean_norm/layer4": 9.155107080936432, "mean_norm/layer5": 10.422005653381348, "mean_norm/layer6": 8.88517153263092, "mean_norm/layer7": 9.177704691886902, "mean_norm/layer8": 9.441220581531525, "mean_norm/layer9": 9.407763183116913, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 4250 }, { "epoch": 1.77, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.45527960639726134, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7823808193206787, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8168, "eval_samples_per_second": 20.395, "eval_steps_per_second": 0.677, "step": 4250 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.8, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.801, "max_norm": 20.759300231933594, "max_norm/layer0": 17.134748458862305, "max_norm/layer1": 17.7257137298584, "max_norm/layer10": 19.151565551757812, "max_norm/layer11": 18.056488037109375, "max_norm/layer12": 18.92339324951172, "max_norm/layer13": 16.7547664642334, "max_norm/layer14": 18.19631004333496, "max_norm/layer15": 19.982650756835938, "max_norm/layer16": 17.59579849243164, "max_norm/layer17": 19.820369720458984, "max_norm/layer18": 18.083040237426758, "max_norm/layer19": 17.67841911315918, "max_norm/layer2": 14.976433753967285, "max_norm/layer20": 18.92435646057129, "max_norm/layer21": 18.350635528564453, "max_norm/layer22": 18.53485679626465, "max_norm/layer23": 18.46183967590332, "max_norm/layer3": 17.098966598510742, "max_norm/layer4": 17.442232131958008, "max_norm/layer5": 20.759300231933594, "max_norm/layer6": 16.3858699798584, "max_norm/layer7": 18.518962860107422, "max_norm/layer8": 18.962594985961914, "max_norm/layer9": 18.582992553710938, "mean_norm": 9.545886618395647, "mean_norm/layer0": 9.101129949092865, "mean_norm/layer1": 9.165426433086395, "mean_norm/layer10": 9.47351598739624, "mean_norm/layer11": 9.643661797046661, "mean_norm/layer12": 9.889671385288239, "mean_norm/layer13": 9.428849935531616, "mean_norm/layer14": 9.675801992416382, "mean_norm/layer15": 9.84381878376007, "mean_norm/layer16": 9.496441066265106, "mean_norm/layer17": 9.815237402915955, "mean_norm/layer18": 9.558767795562744, "mean_norm/layer19": 9.57570618391037, "mean_norm/layer2": 8.496287822723389, "mean_norm/layer20": 9.672922849655151, "mean_norm/layer21": 9.62732309103012, "mean_norm/layer22": 10.17811006307602, "mean_norm/layer23": 10.145203053951263, "mean_norm/layer3": 9.76219356060028, "mean_norm/layer4": 9.163109600543976, "mean_norm/layer5": 10.44065660238266, "mean_norm/layer6": 8.89125519990921, "mean_norm/layer7": 9.186071753501892, "mean_norm/layer8": 9.452130377292633, "mean_norm/layer9": 9.417986154556274, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 4300 }, { "epoch": 1.8, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.45536884032400027, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.780466318130493, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5429, "eval_samples_per_second": 20.879, "eval_steps_per_second": 0.693, "step": 4300 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.82, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8073, "max_norm": 20.906658172607422, "max_norm/layer0": 17.20047378540039, "max_norm/layer1": 17.7962703704834, "max_norm/layer10": 19.260923385620117, "max_norm/layer11": 18.1672306060791, "max_norm/layer12": 19.01469612121582, "max_norm/layer13": 16.84528923034668, "max_norm/layer14": 18.279903411865234, "max_norm/layer15": 20.088977813720703, "max_norm/layer16": 17.689979553222656, "max_norm/layer17": 19.94285774230957, "max_norm/layer18": 18.162460327148438, "max_norm/layer19": 17.780181884765625, "max_norm/layer2": 15.040743827819824, "max_norm/layer20": 19.01894187927246, "max_norm/layer21": 18.461332321166992, "max_norm/layer22": 18.63921546936035, "max_norm/layer23": 18.553007125854492, "max_norm/layer3": 17.176898956298828, "max_norm/layer4": 17.507030487060547, "max_norm/layer5": 20.906658172607422, "max_norm/layer6": 16.445636749267578, "max_norm/layer7": 18.60109519958496, "max_norm/layer8": 19.051607131958008, "max_norm/layer9": 18.66645622253418, "mean_norm": 9.557600170373917, "mean_norm/layer0": 9.110860824584961, "mean_norm/layer1": 9.175042450428009, "mean_norm/layer10": 9.484363615512848, "mean_norm/layer11": 9.655846178531647, "mean_norm/layer12": 9.904585361480713, "mean_norm/layer13": 9.43986588716507, "mean_norm/layer14": 9.688460767269135, "mean_norm/layer15": 9.85785061120987, "mean_norm/layer16": 9.508097112178802, "mean_norm/layer17": 9.829115748405457, "mean_norm/layer18": 9.570830702781677, "mean_norm/layer19": 9.58799260854721, "mean_norm/layer2": 8.499535202980042, "mean_norm/layer20": 9.685294151306152, "mean_norm/layer21": 9.63974541425705, "mean_norm/layer22": 10.195148229598999, "mean_norm/layer23": 10.16170072555542, "mean_norm/layer3": 9.775292813777924, "mean_norm/layer4": 9.170989692211151, "mean_norm/layer5": 10.459139466285706, "mean_norm/layer6": 8.897323548793793, "mean_norm/layer7": 9.194344580173492, "mean_norm/layer8": 9.462877452373505, "mean_norm/layer9": 9.428100943565369, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 4350 }, { "epoch": 1.82, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.45615572131433463, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7751033306121826, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8372, "eval_samples_per_second": 20.359, "eval_steps_per_second": 0.676, "step": 4350 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.84, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.7988, "max_norm": 21.04453468322754, "max_norm/layer0": 17.255943298339844, "max_norm/layer1": 17.868118286132812, "max_norm/layer10": 19.348005294799805, "max_norm/layer11": 18.268312454223633, "max_norm/layer12": 19.103347778320312, "max_norm/layer13": 16.914888381958008, "max_norm/layer14": 18.352100372314453, "max_norm/layer15": 20.2009334564209, "max_norm/layer16": 17.780242919921875, "max_norm/layer17": 20.08079719543457, "max_norm/layer18": 18.235071182250977, "max_norm/layer19": 17.867902755737305, "max_norm/layer2": 15.10726261138916, "max_norm/layer20": 19.109235763549805, "max_norm/layer21": 18.55447769165039, "max_norm/layer22": 18.748037338256836, "max_norm/layer23": 18.645830154418945, "max_norm/layer3": 17.249866485595703, "max_norm/layer4": 17.581409454345703, "max_norm/layer5": 21.04453468322754, "max_norm/layer6": 16.516193389892578, "max_norm/layer7": 18.686376571655273, "max_norm/layer8": 19.148639678955078, "max_norm/layer9": 18.74429702758789, "mean_norm": 9.569357293347517, "mean_norm/layer0": 9.120525360107422, "mean_norm/layer1": 9.184691786766052, "mean_norm/layer10": 9.495336592197418, "mean_norm/layer11": 9.668105900287628, "mean_norm/layer12": 9.919475436210632, "mean_norm/layer13": 9.45104306936264, "mean_norm/layer14": 9.70114290714264, "mean_norm/layer15": 9.872009038925171, "mean_norm/layer16": 9.519804000854492, "mean_norm/layer17": 9.842991590499878, "mean_norm/layer18": 9.58296275138855, "mean_norm/layer19": 9.600463032722473, "mean_norm/layer2": 8.502758204936981, "mean_norm/layer20": 9.69754272699356, "mean_norm/layer21": 9.652194738388062, "mean_norm/layer22": 10.212375521659851, "mean_norm/layer23": 10.178341031074524, "mean_norm/layer3": 9.788307666778564, "mean_norm/layer4": 9.179190576076508, "mean_norm/layer5": 10.477513015270233, "mean_norm/layer6": 8.903360545635223, "mean_norm/layer7": 9.202587485313416, "mean_norm/layer8": 9.473590970039368, "mean_norm/layer9": 9.438261091709137, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 4400 }, { "epoch": 1.84, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.45590424388443396, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.775115489959717, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5853, "eval_samples_per_second": 20.802, "eval_steps_per_second": 0.691, "step": 4400 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.86, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.7915, "max_norm": 21.17486572265625, "max_norm/layer0": 17.298419952392578, "max_norm/layer1": 17.930343627929688, "max_norm/layer10": 19.43759536743164, "max_norm/layer11": 18.360822677612305, "max_norm/layer12": 19.205596923828125, "max_norm/layer13": 17.017274856567383, "max_norm/layer14": 18.43059730529785, "max_norm/layer15": 20.340652465820312, "max_norm/layer16": 17.854707717895508, "max_norm/layer17": 20.208559036254883, "max_norm/layer18": 18.296897888183594, "max_norm/layer19": 17.949644088745117, "max_norm/layer2": 15.163930892944336, "max_norm/layer20": 19.194684982299805, "max_norm/layer21": 18.658071517944336, "max_norm/layer22": 18.858280181884766, "max_norm/layer23": 18.766464233398438, "max_norm/layer3": 17.32754898071289, "max_norm/layer4": 17.661903381347656, "max_norm/layer5": 21.17486572265625, "max_norm/layer6": 16.588512420654297, "max_norm/layer7": 18.78378677368164, "max_norm/layer8": 19.22671890258789, "max_norm/layer9": 18.828065872192383, "mean_norm": 9.58110864708821, "mean_norm/layer0": 9.13014280796051, "mean_norm/layer1": 9.19428437948227, "mean_norm/layer10": 9.506189048290253, "mean_norm/layer11": 9.68019586801529, "mean_norm/layer12": 9.93433165550232, "mean_norm/layer13": 9.462150931358337, "mean_norm/layer14": 9.713736414909363, "mean_norm/layer15": 9.886185884475708, "mean_norm/layer16": 9.531567752361298, "mean_norm/layer17": 9.856738686561584, "mean_norm/layer18": 9.595190525054932, "mean_norm/layer19": 9.612755954265594, "mean_norm/layer2": 8.505994141101837, "mean_norm/layer20": 9.709813356399536, "mean_norm/layer21": 9.664562940597534, "mean_norm/layer22": 10.22979611158371, "mean_norm/layer23": 10.195049226284027, "mean_norm/layer3": 9.801417529582977, "mean_norm/layer4": 9.187121748924255, "mean_norm/layer5": 10.495978653430939, "mean_norm/layer6": 8.909496486186981, "mean_norm/layer7": 9.211061120033264, "mean_norm/layer8": 9.48429411649704, "mean_norm/layer9": 9.448552191257477, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 4450 }, { "epoch": 1.86, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.45618005783980886, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7739932537078857, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8201, "eval_samples_per_second": 20.389, "eval_steps_per_second": 0.677, "step": 4450 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.88, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.8088, "max_norm": 21.288240432739258, "max_norm/layer0": 17.345314025878906, "max_norm/layer1": 18.00452423095703, "max_norm/layer10": 19.536436080932617, "max_norm/layer11": 18.446500778198242, "max_norm/layer12": 19.339845657348633, "max_norm/layer13": 17.11781120300293, "max_norm/layer14": 18.51311683654785, "max_norm/layer15": 20.480234146118164, "max_norm/layer16": 17.940902709960938, "max_norm/layer17": 20.350200653076172, "max_norm/layer18": 18.398128509521484, "max_norm/layer19": 18.029136657714844, "max_norm/layer2": 15.231613159179688, "max_norm/layer20": 19.287769317626953, "max_norm/layer21": 18.776599884033203, "max_norm/layer22": 18.979724884033203, "max_norm/layer23": 18.858877182006836, "max_norm/layer3": 17.388498306274414, "max_norm/layer4": 17.775165557861328, "max_norm/layer5": 21.288240432739258, "max_norm/layer6": 16.653141021728516, "max_norm/layer7": 18.898910522460938, "max_norm/layer8": 19.32200050354004, "max_norm/layer9": 18.906003952026367, "mean_norm": 9.592867535849413, "mean_norm/layer0": 9.139825999736786, "mean_norm/layer1": 9.20407783985138, "mean_norm/layer10": 9.517067611217499, "mean_norm/layer11": 9.692343294620514, "mean_norm/layer12": 9.94935166835785, "mean_norm/layer13": 9.473208963871002, "mean_norm/layer14": 9.726474404335022, "mean_norm/layer15": 9.900470495223999, "mean_norm/layer16": 9.54332023859024, "mean_norm/layer17": 9.870534479618073, "mean_norm/layer18": 9.60720431804657, "mean_norm/layer19": 9.625152111053467, "mean_norm/layer2": 8.509223759174347, "mean_norm/layer20": 9.722173869609833, "mean_norm/layer21": 9.67687976360321, "mean_norm/layer22": 10.246850192546844, "mean_norm/layer23": 10.211505055427551, "mean_norm/layer3": 9.814597129821777, "mean_norm/layer4": 9.194973826408386, "mean_norm/layer5": 10.514500916004181, "mean_norm/layer6": 8.915790915489197, "mean_norm/layer7": 9.219484984874725, "mean_norm/layer8": 9.49491000175476, "mean_norm/layer9": 9.458899021148682, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 4500 }, { "epoch": 1.88, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.456188170014967, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7761588096618652, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8106, "eval_samples_per_second": 20.405, "eval_steps_per_second": 0.677, "step": 4500 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.9, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.7959, "max_norm": 21.412240982055664, "max_norm/layer0": 17.401063919067383, "max_norm/layer1": 18.084028244018555, "max_norm/layer10": 19.634403228759766, "max_norm/layer11": 18.531543731689453, "max_norm/layer12": 19.471622467041016, "max_norm/layer13": 17.196971893310547, "max_norm/layer14": 18.595664978027344, "max_norm/layer15": 20.628389358520508, "max_norm/layer16": 18.04037857055664, "max_norm/layer17": 20.481491088867188, "max_norm/layer18": 18.486473083496094, "max_norm/layer19": 18.102190017700195, "max_norm/layer2": 15.300971031188965, "max_norm/layer20": 19.38399887084961, "max_norm/layer21": 18.876100540161133, "max_norm/layer22": 19.10553550720215, "max_norm/layer23": 18.965547561645508, "max_norm/layer3": 17.45551872253418, "max_norm/layer4": 17.88532066345215, "max_norm/layer5": 21.412240982055664, "max_norm/layer6": 16.702308654785156, "max_norm/layer7": 19.0312442779541, "max_norm/layer8": 19.416467666625977, "max_norm/layer9": 19.000038146972656, "mean_norm": 9.60454748570919, "mean_norm/layer0": 9.149442195892334, "mean_norm/layer1": 9.213627398014069, "mean_norm/layer10": 9.527814865112305, "mean_norm/layer11": 9.704487025737762, "mean_norm/layer12": 9.964283287525177, "mean_norm/layer13": 9.484197497367859, "mean_norm/layer14": 9.73909717798233, "mean_norm/layer15": 9.914574265480042, "mean_norm/layer16": 9.55492353439331, "mean_norm/layer17": 9.884373843669891, "mean_norm/layer18": 9.619216859340668, "mean_norm/layer19": 9.637514412403107, "mean_norm/layer2": 8.512493133544922, "mean_norm/layer20": 9.734349429607391, "mean_norm/layer21": 9.689200222492218, "mean_norm/layer22": 10.263882875442505, "mean_norm/layer23": 10.227949321269989, "mean_norm/layer3": 9.827821612358093, "mean_norm/layer4": 9.202875196933746, "mean_norm/layer5": 10.532879412174225, "mean_norm/layer6": 8.921751141548157, "mean_norm/layer7": 9.227769911289215, "mean_norm/layer8": 9.505604028701782, "mean_norm/layer9": 9.469011008739471, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 4550 }, { "epoch": 1.9, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4568898731661414, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.768836259841919, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5533, "eval_samples_per_second": 20.86, "eval_steps_per_second": 0.692, "step": 4550 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.92, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.7942, "max_norm": 21.53392791748047, "max_norm/layer0": 17.465423583984375, "max_norm/layer1": 18.17967414855957, "max_norm/layer10": 19.711856842041016, "max_norm/layer11": 18.609466552734375, "max_norm/layer12": 19.569843292236328, "max_norm/layer13": 17.279605865478516, "max_norm/layer14": 18.686342239379883, "max_norm/layer15": 20.776939392089844, "max_norm/layer16": 18.130950927734375, "max_norm/layer17": 20.6143741607666, "max_norm/layer18": 18.57437515258789, "max_norm/layer19": 18.213754653930664, "max_norm/layer2": 15.358172416687012, "max_norm/layer20": 19.491958618164062, "max_norm/layer21": 18.976621627807617, "max_norm/layer22": 19.238208770751953, "max_norm/layer23": 19.04021644592285, "max_norm/layer3": 17.52911376953125, "max_norm/layer4": 17.98028564453125, "max_norm/layer5": 21.53392791748047, "max_norm/layer6": 16.75553321838379, "max_norm/layer7": 19.121355056762695, "max_norm/layer8": 19.50104522705078, "max_norm/layer9": 19.088035583496094, "mean_norm": 9.616017671922842, "mean_norm/layer0": 9.158940315246582, "mean_norm/layer1": 9.223099112510681, "mean_norm/layer10": 9.538458824157715, "mean_norm/layer11": 9.716457784175873, "mean_norm/layer12": 9.978936910629272, "mean_norm/layer13": 9.49501234292984, "mean_norm/layer14": 9.751602709293365, "mean_norm/layer15": 9.92855703830719, "mean_norm/layer16": 9.566272795200348, "mean_norm/layer17": 9.897848546504974, "mean_norm/layer18": 9.630900084972382, "mean_norm/layer19": 9.649376332759857, "mean_norm/layer2": 8.51567929983139, "mean_norm/layer20": 9.746204793453217, "mean_norm/layer21": 9.70108163356781, "mean_norm/layer22": 10.280311226844788, "mean_norm/layer23": 10.244093477725983, "mean_norm/layer3": 9.840932130813599, "mean_norm/layer4": 9.21077847480774, "mean_norm/layer5": 10.55105346441269, "mean_norm/layer6": 8.927722990512848, "mean_norm/layer7": 9.2358558177948, "mean_norm/layer8": 9.51610243320465, "mean_norm/layer9": 9.479145586490631, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 4600 }, { "epoch": 1.92, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.45723058452278104, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7702465057373047, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8086, "eval_samples_per_second": 20.409, "eval_steps_per_second": 0.677, "step": 4600 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.94, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.7986, "max_norm": 21.668651580810547, "max_norm/layer0": 17.538354873657227, "max_norm/layer1": 18.273357391357422, "max_norm/layer10": 19.79624366760254, "max_norm/layer11": 18.679546356201172, "max_norm/layer12": 19.675004959106445, "max_norm/layer13": 17.357282638549805, "max_norm/layer14": 18.773691177368164, "max_norm/layer15": 20.872743606567383, "max_norm/layer16": 18.211257934570312, "max_norm/layer17": 20.737648010253906, "max_norm/layer18": 18.65184211730957, "max_norm/layer19": 18.335451126098633, "max_norm/layer2": 15.420967102050781, "max_norm/layer20": 19.6021728515625, "max_norm/layer21": 19.084949493408203, "max_norm/layer22": 19.35108184814453, "max_norm/layer23": 19.116403579711914, "max_norm/layer3": 17.621381759643555, "max_norm/layer4": 18.06914710998535, "max_norm/layer5": 21.668651580810547, "max_norm/layer6": 16.80304718017578, "max_norm/layer7": 19.21202850341797, "max_norm/layer8": 19.5865421295166, "max_norm/layer9": 19.177453994750977, "mean_norm": 9.62727957467238, "mean_norm/layer0": 9.16827380657196, "mean_norm/layer1": 9.232361853122711, "mean_norm/layer10": 9.549022853374481, "mean_norm/layer11": 9.728195488452911, "mean_norm/layer12": 9.993273079395294, "mean_norm/layer13": 9.505652070045471, "mean_norm/layer14": 9.763936638832092, "mean_norm/layer15": 9.942192792892456, "mean_norm/layer16": 9.577354550361633, "mean_norm/layer17": 9.911025285720825, "mean_norm/layer18": 9.642389118671417, "mean_norm/layer19": 9.660954356193542, "mean_norm/layer2": 8.51875525712967, "mean_norm/layer20": 9.758077919483185, "mean_norm/layer21": 9.712872505187988, "mean_norm/layer22": 10.296362459659576, "mean_norm/layer23": 10.259945154190063, "mean_norm/layer3": 9.853806853294373, "mean_norm/layer4": 9.218483328819275, "mean_norm/layer5": 10.56893503665924, "mean_norm/layer6": 8.933514535427094, "mean_norm/layer7": 9.243833124637604, "mean_norm/layer8": 9.526439189910889, "mean_norm/layer9": 9.489052534103394, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 4650 }, { "epoch": 1.94, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.45738065976320563, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7653119564056396, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8081, "eval_samples_per_second": 20.41, "eval_steps_per_second": 0.678, "step": 4650 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.96, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.7875, "max_norm": 21.812347412109375, "max_norm/layer0": 17.620792388916016, "max_norm/layer1": 18.36002540588379, "max_norm/layer10": 19.895370483398438, "max_norm/layer11": 18.755598068237305, "max_norm/layer12": 19.789051055908203, "max_norm/layer13": 17.464237213134766, "max_norm/layer14": 18.870973587036133, "max_norm/layer15": 20.999399185180664, "max_norm/layer16": 18.288803100585938, "max_norm/layer17": 20.858943939208984, "max_norm/layer18": 18.758024215698242, "max_norm/layer19": 18.439855575561523, "max_norm/layer2": 15.474851608276367, "max_norm/layer20": 19.70724868774414, "max_norm/layer21": 19.183589935302734, "max_norm/layer22": 19.45682716369629, "max_norm/layer23": 19.219196319580078, "max_norm/layer3": 17.702922821044922, "max_norm/layer4": 18.186697006225586, "max_norm/layer5": 21.812347412109375, "max_norm/layer6": 16.868118286132812, "max_norm/layer7": 19.29692268371582, "max_norm/layer8": 19.681978225708008, "max_norm/layer9": 19.25440788269043, "mean_norm": 9.638825024167696, "mean_norm/layer0": 9.17789477109909, "mean_norm/layer1": 9.24189579486847, "mean_norm/layer10": 9.559810936450958, "mean_norm/layer11": 9.74020391702652, "mean_norm/layer12": 10.008057594299316, "mean_norm/layer13": 9.51668530702591, "mean_norm/layer14": 9.776471257209778, "mean_norm/layer15": 9.956155121326447, "mean_norm/layer16": 9.58882337808609, "mean_norm/layer17": 9.924677908420563, "mean_norm/layer18": 9.654309391975403, "mean_norm/layer19": 9.672747313976288, "mean_norm/layer2": 8.521749794483185, "mean_norm/layer20": 9.769956290721893, "mean_norm/layer21": 9.724786639213562, "mean_norm/layer22": 10.312981486320496, "mean_norm/layer23": 10.276334583759308, "mean_norm/layer3": 9.866843819618225, "mean_norm/layer4": 9.22641772031784, "mean_norm/layer5": 10.587312281131744, "mean_norm/layer6": 8.939548313617706, "mean_norm/layer7": 9.252090871334076, "mean_norm/layer8": 9.536978244781494, "mean_norm/layer9": 9.499067842960358, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 4700 }, { "epoch": 1.96, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.45789578288574406, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7666313648223877, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6039, "eval_samples_per_second": 20.769, "eval_steps_per_second": 0.689, "step": 4700 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 1.98, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.7972, "max_norm": 21.965734481811523, "max_norm/layer0": 17.689268112182617, "max_norm/layer1": 18.430795669555664, "max_norm/layer10": 19.9880428314209, "max_norm/layer11": 18.836973190307617, "max_norm/layer12": 19.878585815429688, "max_norm/layer13": 17.54067039489746, "max_norm/layer14": 18.96476173400879, "max_norm/layer15": 21.133108139038086, "max_norm/layer16": 18.367586135864258, "max_norm/layer17": 20.977399826049805, "max_norm/layer18": 18.857200622558594, "max_norm/layer19": 18.525466918945312, "max_norm/layer2": 15.54166316986084, "max_norm/layer20": 19.816164016723633, "max_norm/layer21": 19.26383399963379, "max_norm/layer22": 19.56534194946289, "max_norm/layer23": 19.31981086730957, "max_norm/layer3": 17.79178810119629, "max_norm/layer4": 18.29109764099121, "max_norm/layer5": 21.965734481811523, "max_norm/layer6": 16.933610916137695, "max_norm/layer7": 19.38679313659668, "max_norm/layer8": 19.795856475830078, "max_norm/layer9": 19.338916778564453, "mean_norm": 9.650136108199755, "mean_norm/layer0": 9.18730765581131, "mean_norm/layer1": 9.251254618167877, "mean_norm/layer10": 9.570415079593658, "mean_norm/layer11": 9.752062618732452, "mean_norm/layer12": 10.022457659244537, "mean_norm/layer13": 9.527392983436584, "mean_norm/layer14": 9.788740396499634, "mean_norm/layer15": 9.969760477542877, "mean_norm/layer16": 9.600076735019684, "mean_norm/layer17": 9.938059866428375, "mean_norm/layer18": 9.66584461927414, "mean_norm/layer19": 9.68437534570694, "mean_norm/layer2": 8.524769961833954, "mean_norm/layer20": 9.78183799982071, "mean_norm/layer21": 9.736468076705933, "mean_norm/layer22": 10.328970611095428, "mean_norm/layer23": 10.292193472385406, "mean_norm/layer3": 9.879729330539703, "mean_norm/layer4": 9.234225153923035, "mean_norm/layer5": 10.605308294296265, "mean_norm/layer6": 8.945447742938995, "mean_norm/layer7": 9.260186851024628, "mean_norm/layer8": 9.547355473041534, "mean_norm/layer9": 9.509025573730469, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 4750 }, { "epoch": 1.98, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4573968841135218, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7658636569976807, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5352, "eval_samples_per_second": 20.893, "eval_steps_per_second": 0.694, "step": 4750 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.0, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.7549, "max_norm": 22.097200393676758, "max_norm/layer0": 17.7503719329834, "max_norm/layer1": 18.497804641723633, "max_norm/layer10": 20.086458206176758, "max_norm/layer11": 18.916461944580078, "max_norm/layer12": 19.985445022583008, "max_norm/layer13": 17.607402801513672, "max_norm/layer14": 19.063182830810547, "max_norm/layer15": 21.26007080078125, "max_norm/layer16": 18.455631256103516, "max_norm/layer17": 21.091989517211914, "max_norm/layer18": 18.967914581298828, "max_norm/layer19": 18.608983993530273, "max_norm/layer2": 15.61719036102295, "max_norm/layer20": 19.923967361450195, "max_norm/layer21": 19.351205825805664, "max_norm/layer22": 19.670289993286133, "max_norm/layer23": 19.406200408935547, "max_norm/layer3": 17.88211441040039, "max_norm/layer4": 18.38958168029785, "max_norm/layer5": 22.097200393676758, "max_norm/layer6": 16.993507385253906, "max_norm/layer7": 19.465435028076172, "max_norm/layer8": 19.875547409057617, "max_norm/layer9": 19.429819107055664, "mean_norm": 9.661303776005903, "mean_norm/layer0": 9.196622729301453, "mean_norm/layer1": 9.260469496250153, "mean_norm/layer10": 9.580876767635345, "mean_norm/layer11": 9.763825356960297, "mean_norm/layer12": 10.036564350128174, "mean_norm/layer13": 9.537844955921173, "mean_norm/layer14": 9.800962150096893, "mean_norm/layer15": 9.983208060264587, "mean_norm/layer16": 9.61099511384964, "mean_norm/layer17": 9.951125979423523, "mean_norm/layer18": 9.677132070064545, "mean_norm/layer19": 9.695655643939972, "mean_norm/layer2": 8.52772867679596, "mean_norm/layer20": 9.793645083904266, "mean_norm/layer21": 9.748089730739594, "mean_norm/layer22": 10.345001339912415, "mean_norm/layer23": 10.307753026485443, "mean_norm/layer3": 9.892489731311798, "mean_norm/layer4": 9.24187582731247, "mean_norm/layer5": 10.623258709907532, "mean_norm/layer6": 8.951395571231842, "mean_norm/layer7": 9.2682363986969, "mean_norm/layer8": 9.557595670223236, "mean_norm/layer9": 9.518938183784485, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 4800 }, { "epoch": 2.0, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4563869183063401, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.770103693008423, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7952, "eval_samples_per_second": 20.432, "eval_steps_per_second": 0.678, "step": 4800 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.03, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6161, "max_norm": 22.229122161865234, "max_norm/layer0": 17.81972312927246, "max_norm/layer1": 18.582639694213867, "max_norm/layer10": 20.194303512573242, "max_norm/layer11": 18.99195671081543, "max_norm/layer12": 20.07562828063965, "max_norm/layer13": 17.683574676513672, "max_norm/layer14": 19.15118408203125, "max_norm/layer15": 21.398839950561523, "max_norm/layer16": 18.56853485107422, "max_norm/layer17": 21.212589263916016, "max_norm/layer18": 19.053190231323242, "max_norm/layer19": 18.710668563842773, "max_norm/layer2": 15.681137084960938, "max_norm/layer20": 20.02528190612793, "max_norm/layer21": 19.46278190612793, "max_norm/layer22": 19.791105270385742, "max_norm/layer23": 19.512958526611328, "max_norm/layer3": 17.977426528930664, "max_norm/layer4": 18.481155395507812, "max_norm/layer5": 22.229122161865234, "max_norm/layer6": 17.07346534729004, "max_norm/layer7": 19.551734924316406, "max_norm/layer8": 19.978107452392578, "max_norm/layer9": 19.52581024169922, "mean_norm": 9.67351096123457, "mean_norm/layer0": 9.206518650054932, "mean_norm/layer1": 9.270343840122223, "mean_norm/layer10": 9.592012703418732, "mean_norm/layer11": 9.776739001274109, "mean_norm/layer12": 10.052140772342682, "mean_norm/layer13": 9.54944109916687, "mean_norm/layer14": 9.814337015151978, "mean_norm/layer15": 9.998102486133575, "mean_norm/layer16": 9.623249113559723, "mean_norm/layer17": 9.965643167495728, "mean_norm/layer18": 9.68981283903122, "mean_norm/layer19": 9.708701848983765, "mean_norm/layer2": 8.53110545873642, "mean_norm/layer20": 9.807106733322144, "mean_norm/layer21": 9.761286437511444, "mean_norm/layer22": 10.362047135829926, "mean_norm/layer23": 10.32488340139389, "mean_norm/layer3": 9.906088292598724, "mean_norm/layer4": 9.250157296657562, "mean_norm/layer5": 10.641968488693237, "mean_norm/layer6": 8.957864344120026, "mean_norm/layer7": 9.276767492294312, "mean_norm/layer8": 9.56849718093872, "mean_norm/layer9": 9.52944827079773, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 4850 }, { "epoch": 2.03, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4569547705674061, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7753307819366455, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5422, "eval_samples_per_second": 20.88, "eval_steps_per_second": 0.693, "step": 4850 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.05, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6189, "max_norm": 22.367904663085938, "max_norm/layer0": 17.887420654296875, "max_norm/layer1": 18.671733856201172, "max_norm/layer10": 20.304906845092773, "max_norm/layer11": 19.061819076538086, "max_norm/layer12": 20.177019119262695, "max_norm/layer13": 17.76485252380371, "max_norm/layer14": 19.243499755859375, "max_norm/layer15": 21.52268409729004, "max_norm/layer16": 18.677610397338867, "max_norm/layer17": 21.335845947265625, "max_norm/layer18": 19.159006118774414, "max_norm/layer19": 18.810163497924805, "max_norm/layer2": 15.746746063232422, "max_norm/layer20": 20.1280517578125, "max_norm/layer21": 19.575899124145508, "max_norm/layer22": 19.892805099487305, "max_norm/layer23": 19.60469627380371, "max_norm/layer3": 18.071157455444336, "max_norm/layer4": 18.57114601135254, "max_norm/layer5": 22.367904663085938, "max_norm/layer6": 17.15428924560547, "max_norm/layer7": 19.633804321289062, "max_norm/layer8": 20.081315994262695, "max_norm/layer9": 19.6232967376709, "mean_norm": 9.685750077168146, "mean_norm/layer0": 9.217075943946838, "mean_norm/layer1": 9.280148386955261, "mean_norm/layer10": 9.603125274181366, "mean_norm/layer11": 9.789462864398956, "mean_norm/layer12": 10.067663490772247, "mean_norm/layer13": 9.561099231243134, "mean_norm/layer14": 9.827849328517914, "mean_norm/layer15": 10.012909770011902, "mean_norm/layer16": 9.635309100151062, "mean_norm/layer17": 9.979934573173523, "mean_norm/layer18": 9.702326834201813, "mean_norm/layer19": 9.721765398979187, "mean_norm/layer2": 8.534556448459625, "mean_norm/layer20": 9.820671617984772, "mean_norm/layer21": 9.774718105793, "mean_norm/layer22": 10.379175782203674, "mean_norm/layer23": 10.342072427272797, "mean_norm/layer3": 9.919848799705505, "mean_norm/layer4": 9.25857150554657, "mean_norm/layer5": 10.660731792449951, "mean_norm/layer6": 8.964467108249664, "mean_norm/layer7": 9.285303235054016, "mean_norm/layer8": 9.579225778579712, "mean_norm/layer9": 9.539989054203033, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 4900 }, { "epoch": 2.05, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.45636663786844484, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.778195858001709, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5841, "eval_samples_per_second": 20.804, "eval_steps_per_second": 0.691, "step": 4900 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.07, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6266, "max_norm": 22.497936248779297, "max_norm/layer0": 17.95612144470215, "max_norm/layer1": 18.766647338867188, "max_norm/layer10": 20.393529891967773, "max_norm/layer11": 19.140981674194336, "max_norm/layer12": 20.30097198486328, "max_norm/layer13": 17.845705032348633, "max_norm/layer14": 19.33021354675293, "max_norm/layer15": 21.635671615600586, "max_norm/layer16": 18.780454635620117, "max_norm/layer17": 21.467220306396484, "max_norm/layer18": 19.249921798706055, "max_norm/layer19": 18.916114807128906, "max_norm/layer2": 15.8043794631958, "max_norm/layer20": 20.2207088470459, "max_norm/layer21": 19.68240737915039, "max_norm/layer22": 20.003076553344727, "max_norm/layer23": 19.702362060546875, "max_norm/layer3": 18.159029006958008, "max_norm/layer4": 18.67041015625, "max_norm/layer5": 22.497936248779297, "max_norm/layer6": 17.22257423400879, "max_norm/layer7": 19.70867156982422, "max_norm/layer8": 20.17713165283203, "max_norm/layer9": 19.7199764251709, "mean_norm": 9.698031273980936, "mean_norm/layer0": 9.2280832529068, "mean_norm/layer1": 9.29011619091034, "mean_norm/layer10": 9.614328265190125, "mean_norm/layer11": 9.802447438240051, "mean_norm/layer12": 10.083309292793274, "mean_norm/layer13": 9.572734773159027, "mean_norm/layer14": 9.841307997703552, "mean_norm/layer15": 10.027710676193237, "mean_norm/layer16": 9.647395431995392, "mean_norm/layer17": 9.994074761867523, "mean_norm/layer18": 9.714804410934448, "mean_norm/layer19": 9.73473072052002, "mean_norm/layer2": 8.538142025470734, "mean_norm/layer20": 9.833818078041077, "mean_norm/layer21": 9.787812173366547, "mean_norm/layer22": 10.39659869670868, "mean_norm/layer23": 10.359000742435455, "mean_norm/layer3": 9.933819353580475, "mean_norm/layer4": 9.267073810100555, "mean_norm/layer5": 10.679556548595428, "mean_norm/layer6": 8.971089124679565, "mean_norm/layer7": 9.293950021266937, "mean_norm/layer8": 9.59020709991455, "mean_norm/layer9": 9.550639688968658, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 4950 }, { "epoch": 2.07, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.45755507152910446, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.778442859649658, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 10.7905, "eval_samples_per_second": 22.334, "eval_steps_per_second": 0.741, "step": 4950 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.09, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6468, "max_norm": 22.62725257873535, "max_norm/layer0": 18.031448364257812, "max_norm/layer1": 18.85249137878418, "max_norm/layer10": 20.487457275390625, "max_norm/layer11": 19.27031898498535, "max_norm/layer12": 20.434553146362305, "max_norm/layer13": 17.91874122619629, "max_norm/layer14": 19.41231346130371, "max_norm/layer15": 21.761850357055664, "max_norm/layer16": 18.886045455932617, "max_norm/layer17": 21.617713928222656, "max_norm/layer18": 19.34942626953125, "max_norm/layer19": 19.026630401611328, "max_norm/layer2": 15.86556339263916, "max_norm/layer20": 20.321598052978516, "max_norm/layer21": 19.79185676574707, "max_norm/layer22": 20.136564254760742, "max_norm/layer23": 19.804283142089844, "max_norm/layer3": 18.258943557739258, "max_norm/layer4": 18.755266189575195, "max_norm/layer5": 22.62725257873535, "max_norm/layer6": 17.279165267944336, "max_norm/layer7": 19.7928466796875, "max_norm/layer8": 20.278255462646484, "max_norm/layer9": 19.814647674560547, "mean_norm": 9.71029263238112, "mean_norm/layer0": 9.239352583885193, "mean_norm/layer1": 9.300042927265167, "mean_norm/layer10": 9.625477373600006, "mean_norm/layer11": 9.815385699272156, "mean_norm/layer12": 10.098966121673584, "mean_norm/layer13": 9.584208488464355, "mean_norm/layer14": 9.854663968086243, "mean_norm/layer15": 10.042455911636353, "mean_norm/layer16": 9.659296989440918, "mean_norm/layer17": 10.008129358291626, "mean_norm/layer18": 9.727139055728912, "mean_norm/layer19": 9.74753886461258, "mean_norm/layer2": 8.541776299476624, "mean_norm/layer20": 9.846904814243317, "mean_norm/layer21": 9.800666272640228, "mean_norm/layer22": 10.414086759090424, "mean_norm/layer23": 10.375837922096252, "mean_norm/layer3": 9.947814524173737, "mean_norm/layer4": 9.275640845298767, "mean_norm/layer5": 10.698535740375519, "mean_norm/layer6": 8.977764904499054, "mean_norm/layer7": 9.302622854709625, "mean_norm/layer8": 9.601214170455933, "mean_norm/layer9": 9.56150072813034, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 5000 }, { "epoch": 2.09, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4572954819240457, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7788991928100586, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8093, "eval_samples_per_second": 20.408, "eval_steps_per_second": 0.677, "step": 5000 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.11, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6487, "max_norm": 22.76466941833496, "max_norm/layer0": 18.100759506225586, "max_norm/layer1": 18.94605827331543, "max_norm/layer10": 20.581647872924805, "max_norm/layer11": 19.369783401489258, "max_norm/layer12": 20.52696990966797, "max_norm/layer13": 17.98175048828125, "max_norm/layer14": 19.488126754760742, "max_norm/layer15": 21.85770034790039, "max_norm/layer16": 18.97614860534668, "max_norm/layer17": 21.745214462280273, "max_norm/layer18": 19.442224502563477, "max_norm/layer19": 19.127676010131836, "max_norm/layer2": 15.919937133789062, "max_norm/layer20": 20.431379318237305, "max_norm/layer21": 19.900375366210938, "max_norm/layer22": 20.263553619384766, "max_norm/layer23": 19.90934181213379, "max_norm/layer3": 18.351699829101562, "max_norm/layer4": 18.841182708740234, "max_norm/layer5": 22.76466941833496, "max_norm/layer6": 17.338943481445312, "max_norm/layer7": 19.896106719970703, "max_norm/layer8": 20.378662109375, "max_norm/layer9": 19.90271759033203, "mean_norm": 9.722342488666376, "mean_norm/layer0": 9.250700294971466, "mean_norm/layer1": 9.309888064861298, "mean_norm/layer10": 9.63647472858429, "mean_norm/layer11": 9.828037559986115, "mean_norm/layer12": 10.114314317703247, "mean_norm/layer13": 9.595680236816406, "mean_norm/layer14": 9.86775666475296, "mean_norm/layer15": 10.057121217250824, "mean_norm/layer16": 9.671030879020691, "mean_norm/layer17": 10.021993637084961, "mean_norm/layer18": 9.739132702350616, "mean_norm/layer19": 9.759905397891998, "mean_norm/layer2": 8.54540067911148, "mean_norm/layer20": 9.859400808811188, "mean_norm/layer21": 9.81334936618805, "mean_norm/layer22": 10.431015074253082, "mean_norm/layer23": 10.392397820949554, "mean_norm/layer3": 9.961604416370392, "mean_norm/layer4": 9.284013032913208, "mean_norm/layer5": 10.717323243618011, "mean_norm/layer6": 8.984280347824097, "mean_norm/layer7": 9.311186790466309, "mean_norm/layer8": 9.612077295780182, "mean_norm/layer9": 9.572135150432587, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 5050 }, { "epoch": 2.11, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.45699938753077557, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7762091159820557, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8214, "eval_samples_per_second": 20.387, "eval_steps_per_second": 0.677, "step": 5050 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.13, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6467, "max_norm": 22.89735984802246, "max_norm/layer0": 18.166860580444336, "max_norm/layer1": 19.054595947265625, "max_norm/layer10": 20.66739845275879, "max_norm/layer11": 19.451705932617188, "max_norm/layer12": 20.62177848815918, "max_norm/layer13": 18.060523986816406, "max_norm/layer14": 19.57383155822754, "max_norm/layer15": 21.97449493408203, "max_norm/layer16": 19.052349090576172, "max_norm/layer17": 21.87696647644043, "max_norm/layer18": 19.54570770263672, "max_norm/layer19": 19.23660659790039, "max_norm/layer2": 15.98861026763916, "max_norm/layer20": 20.53759002685547, "max_norm/layer21": 20.000146865844727, "max_norm/layer22": 20.37427520751953, "max_norm/layer23": 20.004507064819336, "max_norm/layer3": 18.47233772277832, "max_norm/layer4": 18.915876388549805, "max_norm/layer5": 22.89735984802246, "max_norm/layer6": 17.400609970092773, "max_norm/layer7": 19.98491668701172, "max_norm/layer8": 20.48213005065918, "max_norm/layer9": 20.012739181518555, "mean_norm": 9.734544103344282, "mean_norm/layer0": 9.2623251080513, "mean_norm/layer1": 9.320045828819275, "mean_norm/layer10": 9.647578060626984, "mean_norm/layer11": 9.840642750263214, "mean_norm/layer12": 10.129788398742676, "mean_norm/layer13": 9.607102155685425, "mean_norm/layer14": 9.88111037015915, "mean_norm/layer15": 10.071675181388855, "mean_norm/layer16": 9.682976722717285, "mean_norm/layer17": 10.03602159023285, "mean_norm/layer18": 9.751314342021942, "mean_norm/layer19": 9.7725231051445, "mean_norm/layer2": 8.549007654190063, "mean_norm/layer20": 9.87232106924057, "mean_norm/layer21": 9.826198995113373, "mean_norm/layer22": 10.448007762432098, "mean_norm/layer23": 10.409220039844513, "mean_norm/layer3": 9.975856363773346, "mean_norm/layer4": 9.29235965013504, "mean_norm/layer5": 10.736477971076965, "mean_norm/layer6": 8.990878164768219, "mean_norm/layer7": 9.319936335086823, "mean_norm/layer8": 9.622983694076538, "mean_norm/layer9": 9.582707166671753, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 5100 }, { "epoch": 2.13, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4562327869783364, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.777289628982544, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5722, "eval_samples_per_second": 20.826, "eval_steps_per_second": 0.691, "step": 5100 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.15, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6599, "max_norm": 23.004852294921875, "max_norm/layer0": 18.246042251586914, "max_norm/layer1": 19.173181533813477, "max_norm/layer10": 20.759347915649414, "max_norm/layer11": 19.53813362121582, "max_norm/layer12": 20.722137451171875, "max_norm/layer13": 18.14091682434082, "max_norm/layer14": 19.650548934936523, "max_norm/layer15": 22.08029556274414, "max_norm/layer16": 19.13140869140625, "max_norm/layer17": 22.015832901000977, "max_norm/layer18": 19.6434268951416, "max_norm/layer19": 19.330032348632812, "max_norm/layer2": 16.050338745117188, "max_norm/layer20": 20.631410598754883, "max_norm/layer21": 20.11321258544922, "max_norm/layer22": 20.477571487426758, "max_norm/layer23": 20.0946102142334, "max_norm/layer3": 18.563167572021484, "max_norm/layer4": 19.002338409423828, "max_norm/layer5": 23.004852294921875, "max_norm/layer6": 17.46533966064453, "max_norm/layer7": 20.085609436035156, "max_norm/layer8": 20.567922592163086, "max_norm/layer9": 20.1201229095459, "mean_norm": 9.746603799362978, "mean_norm/layer0": 9.273974597454071, "mean_norm/layer1": 9.330005407333374, "mean_norm/layer10": 9.658581376075745, "mean_norm/layer11": 9.853312253952026, "mean_norm/layer12": 10.145055592060089, "mean_norm/layer13": 9.618417501449585, "mean_norm/layer14": 9.894328236579895, "mean_norm/layer15": 10.086170971393585, "mean_norm/layer16": 9.694756627082825, "mean_norm/layer17": 10.049719512462616, "mean_norm/layer18": 9.76311081647873, "mean_norm/layer19": 9.784685909748077, "mean_norm/layer2": 8.552568674087524, "mean_norm/layer20": 9.884812831878662, "mean_norm/layer21": 9.83890050649643, "mean_norm/layer22": 10.464799404144287, "mean_norm/layer23": 10.425880491733551, "mean_norm/layer3": 9.98993718624115, "mean_norm/layer4": 9.300775229930878, "mean_norm/layer5": 10.755446791648865, "mean_norm/layer6": 8.997404158115387, "mean_norm/layer7": 9.328621327877045, "mean_norm/layer8": 9.63390564918518, "mean_norm/layer9": 9.59332013130188, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 5150 }, { "epoch": 2.15, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4562287308907574, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7837729454040527, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8574, "eval_samples_per_second": 20.325, "eval_steps_per_second": 0.675, "step": 5150 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.17, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6557, "max_norm": 23.14448356628418, "max_norm/layer0": 18.320140838623047, "max_norm/layer1": 19.293155670166016, "max_norm/layer10": 20.861385345458984, "max_norm/layer11": 19.622970581054688, "max_norm/layer12": 20.83387565612793, "max_norm/layer13": 18.22727394104004, "max_norm/layer14": 19.7342586517334, "max_norm/layer15": 22.176088333129883, "max_norm/layer16": 19.23335075378418, "max_norm/layer17": 22.15247917175293, "max_norm/layer18": 19.74405860900879, "max_norm/layer19": 19.428447723388672, "max_norm/layer2": 16.106197357177734, "max_norm/layer20": 20.740074157714844, "max_norm/layer21": 20.21061897277832, "max_norm/layer22": 20.575672149658203, "max_norm/layer23": 20.196548461914062, "max_norm/layer3": 18.64171600341797, "max_norm/layer4": 19.0919132232666, "max_norm/layer5": 23.14448356628418, "max_norm/layer6": 17.518203735351562, "max_norm/layer7": 20.20140838623047, "max_norm/layer8": 20.656841278076172, "max_norm/layer9": 20.232519149780273, "mean_norm": 9.758909354607264, "mean_norm/layer0": 9.285945355892181, "mean_norm/layer1": 9.340204358100891, "mean_norm/layer10": 9.669862568378448, "mean_norm/layer11": 9.86609172821045, "mean_norm/layer12": 10.160631120204926, "mean_norm/layer13": 9.630088806152344, "mean_norm/layer14": 9.907589554786682, "mean_norm/layer15": 10.100898385047913, "mean_norm/layer16": 9.706718385219574, "mean_norm/layer17": 10.063713669776917, "mean_norm/layer18": 9.77525269985199, "mean_norm/layer19": 9.797052562236786, "mean_norm/layer2": 8.556278944015503, "mean_norm/layer20": 9.89769971370697, "mean_norm/layer21": 9.851765871047974, "mean_norm/layer22": 10.482112884521484, "mean_norm/layer23": 10.442677736282349, "mean_norm/layer3": 10.004293620586395, "mean_norm/layer4": 9.30946832895279, "mean_norm/layer5": 10.774869859218597, "mean_norm/layer6": 9.004033982753754, "mean_norm/layer7": 9.337443828582764, "mean_norm/layer8": 9.644962728023529, "mean_norm/layer9": 9.604167819023132, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 5200 }, { "epoch": 2.17, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.45675602227603296, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7779088020324707, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8191, "eval_samples_per_second": 20.391, "eval_steps_per_second": 0.677, "step": 5200 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.19, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6622, "max_norm": 23.266572952270508, "max_norm/layer0": 18.395366668701172, "max_norm/layer1": 19.405048370361328, "max_norm/layer10": 20.944896697998047, "max_norm/layer11": 19.703922271728516, "max_norm/layer12": 20.931015014648438, "max_norm/layer13": 18.32317543029785, "max_norm/layer14": 19.821910858154297, "max_norm/layer15": 22.291412353515625, "max_norm/layer16": 19.31391716003418, "max_norm/layer17": 22.261930465698242, "max_norm/layer18": 19.85706901550293, "max_norm/layer19": 19.519027709960938, "max_norm/layer2": 16.164764404296875, "max_norm/layer20": 20.836637496948242, "max_norm/layer21": 20.297468185424805, "max_norm/layer22": 20.689680099487305, "max_norm/layer23": 20.2936954498291, "max_norm/layer3": 18.744632720947266, "max_norm/layer4": 19.17936897277832, "max_norm/layer5": 23.266572952270508, "max_norm/layer6": 17.58405876159668, "max_norm/layer7": 20.27602195739746, "max_norm/layer8": 20.73196029663086, "max_norm/layer9": 20.32901382446289, "mean_norm": 9.770990287264189, "mean_norm/layer0": 9.297839343547821, "mean_norm/layer1": 9.350374460220337, "mean_norm/layer10": 9.681010365486145, "mean_norm/layer11": 9.878672003746033, "mean_norm/layer12": 10.175971269607544, "mean_norm/layer13": 9.64153653383255, "mean_norm/layer14": 9.920740842819214, "mean_norm/layer15": 10.1153604388237, "mean_norm/layer16": 9.718545377254486, "mean_norm/layer17": 10.077604353427887, "mean_norm/layer18": 9.787011325359344, "mean_norm/layer19": 9.809286177158356, "mean_norm/layer2": 8.559925496578217, "mean_norm/layer20": 9.910324573516846, "mean_norm/layer21": 9.864007830619812, "mean_norm/layer22": 10.498671770095825, "mean_norm/layer23": 10.459164440631866, "mean_norm/layer3": 10.01849776506424, "mean_norm/layer4": 9.317963421344757, "mean_norm/layer5": 10.793861210346222, "mean_norm/layer6": 9.010525822639465, "mean_norm/layer7": 9.346060633659363, "mean_norm/layer8": 9.655949771404266, "mean_norm/layer9": 9.61486166715622, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 5250 }, { "epoch": 2.19, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4562327869783364, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7806594371795654, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8078, "eval_samples_per_second": 20.41, "eval_steps_per_second": 0.678, "step": 5250 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.21, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6863, "max_norm": 23.383268356323242, "max_norm/layer0": 18.473617553710938, "max_norm/layer1": 19.516151428222656, "max_norm/layer10": 21.03118324279785, "max_norm/layer11": 19.796005249023438, "max_norm/layer12": 21.034351348876953, "max_norm/layer13": 18.400510787963867, "max_norm/layer14": 19.89116859436035, "max_norm/layer15": 22.391456604003906, "max_norm/layer16": 19.405385971069336, "max_norm/layer17": 22.3623046875, "max_norm/layer18": 19.993558883666992, "max_norm/layer19": 19.62684440612793, "max_norm/layer2": 16.235048294067383, "max_norm/layer20": 20.942127227783203, "max_norm/layer21": 20.385709762573242, "max_norm/layer22": 20.807687759399414, "max_norm/layer23": 20.388404846191406, "max_norm/layer3": 18.837236404418945, "max_norm/layer4": 19.27210235595703, "max_norm/layer5": 23.383268356323242, "max_norm/layer6": 17.637849807739258, "max_norm/layer7": 20.35446548461914, "max_norm/layer8": 20.819650650024414, "max_norm/layer9": 20.413063049316406, "mean_norm": 9.782849095761776, "mean_norm/layer0": 9.30956506729126, "mean_norm/layer1": 9.360318064689636, "mean_norm/layer10": 9.691880643367767, "mean_norm/layer11": 9.891013085842133, "mean_norm/layer12": 10.190861105918884, "mean_norm/layer13": 9.652708292007446, "mean_norm/layer14": 9.933558821678162, "mean_norm/layer15": 10.129729926586151, "mean_norm/layer16": 9.730214476585388, "mean_norm/layer17": 10.091246604919434, "mean_norm/layer18": 9.79846078157425, "mean_norm/layer19": 9.821033775806427, "mean_norm/layer2": 8.563501000404358, "mean_norm/layer20": 9.922536730766296, "mean_norm/layer21": 9.876113593578339, "mean_norm/layer22": 10.515062034130096, "mean_norm/layer23": 10.47534316778183, "mean_norm/layer3": 10.032526850700378, "mean_norm/layer4": 9.326524913311005, "mean_norm/layer5": 10.812679052352905, "mean_norm/layer6": 9.016940891742706, "mean_norm/layer7": 9.354610204696655, "mean_norm/layer8": 9.666627705097198, "mean_norm/layer9": 9.625321507453918, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 5300 }, { "epoch": 2.21, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.45746178151478645, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7769699096679688, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.555, "eval_samples_per_second": 20.857, "eval_steps_per_second": 0.692, "step": 5300 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.23, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.679, "max_norm": 23.499439239501953, "max_norm/layer0": 18.54343032836914, "max_norm/layer1": 19.622438430786133, "max_norm/layer10": 21.115442276000977, "max_norm/layer11": 19.91941261291504, "max_norm/layer12": 21.136581420898438, "max_norm/layer13": 18.484241485595703, "max_norm/layer14": 19.956186294555664, "max_norm/layer15": 22.505870819091797, "max_norm/layer16": 19.49273109436035, "max_norm/layer17": 22.469552993774414, "max_norm/layer18": 20.106782913208008, "max_norm/layer19": 19.725515365600586, "max_norm/layer2": 16.305809020996094, "max_norm/layer20": 21.03738021850586, "max_norm/layer21": 20.470613479614258, "max_norm/layer22": 20.912168502807617, "max_norm/layer23": 20.484712600708008, "max_norm/layer3": 18.927547454833984, "max_norm/layer4": 19.371742248535156, "max_norm/layer5": 23.499439239501953, "max_norm/layer6": 17.688518524169922, "max_norm/layer7": 20.45281219482422, "max_norm/layer8": 20.927034378051758, "max_norm/layer9": 20.496910095214844, "mean_norm": 9.794714162747065, "mean_norm/layer0": 9.321279466152191, "mean_norm/layer1": 9.370379328727722, "mean_norm/layer10": 9.702701926231384, "mean_norm/layer11": 9.903493821620941, "mean_norm/layer12": 10.205870807170868, "mean_norm/layer13": 9.66382622718811, "mean_norm/layer14": 9.94619619846344, "mean_norm/layer15": 10.14408254623413, "mean_norm/layer16": 9.741806030273438, "mean_norm/layer17": 10.104702532291412, "mean_norm/layer18": 9.809928119182587, "mean_norm/layer19": 9.832951545715332, "mean_norm/layer2": 8.567113637924194, "mean_norm/layer20": 9.934588551521301, "mean_norm/layer21": 9.888190269470215, "mean_norm/layer22": 10.531676888465881, "mean_norm/layer23": 10.491473019123077, "mean_norm/layer3": 10.046574115753174, "mean_norm/layer4": 9.33499801158905, "mean_norm/layer5": 10.831702411174774, "mean_norm/layer6": 9.023348093032837, "mean_norm/layer7": 9.363218486309052, "mean_norm/layer8": 9.677422285079956, "mean_norm/layer9": 9.635615587234497, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 5350 }, { "epoch": 2.23, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4568695927282462, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.774198055267334, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8138, "eval_samples_per_second": 20.4, "eval_steps_per_second": 0.677, "step": 5350 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.25, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6657, "max_norm": 23.616012573242188, "max_norm/layer0": 18.616952896118164, "max_norm/layer1": 19.73339080810547, "max_norm/layer10": 21.219606399536133, "max_norm/layer11": 20.00966453552246, "max_norm/layer12": 21.244117736816406, "max_norm/layer13": 18.585554122924805, "max_norm/layer14": 20.035675048828125, "max_norm/layer15": 22.61372947692871, "max_norm/layer16": 19.60413360595703, "max_norm/layer17": 22.56954574584961, "max_norm/layer18": 20.213354110717773, "max_norm/layer19": 19.81522560119629, "max_norm/layer2": 16.383325576782227, "max_norm/layer20": 21.13914680480957, "max_norm/layer21": 20.564655303955078, "max_norm/layer22": 21.007658004760742, "max_norm/layer23": 20.579490661621094, "max_norm/layer3": 19.023515701293945, "max_norm/layer4": 19.47603416442871, "max_norm/layer5": 23.616012573242188, "max_norm/layer6": 17.729270935058594, "max_norm/layer7": 20.534603118896484, "max_norm/layer8": 21.014896392822266, "max_norm/layer9": 20.589609146118164, "mean_norm": 9.806618705391884, "mean_norm/layer0": 9.33316719532013, "mean_norm/layer1": 9.38050252199173, "mean_norm/layer10": 9.713618159294128, "mean_norm/layer11": 9.915963411331177, "mean_norm/layer12": 10.220970749855042, "mean_norm/layer13": 9.674981594085693, "mean_norm/layer14": 9.959041476249695, "mean_norm/layer15": 10.158335328102112, "mean_norm/layer16": 9.753474414348602, "mean_norm/layer17": 10.118220508098602, "mean_norm/layer18": 9.821493268013, "mean_norm/layer19": 9.844790577888489, "mean_norm/layer2": 8.570688605308533, "mean_norm/layer20": 9.946804225444794, "mean_norm/layer21": 9.90015572309494, "mean_norm/layer22": 10.548267424106598, "mean_norm/layer23": 10.507667362689972, "mean_norm/layer3": 10.06048858165741, "mean_norm/layer4": 9.343421339988708, "mean_norm/layer5": 10.850700914859772, "mean_norm/layer6": 9.029772937297821, "mean_norm/layer7": 9.37190467119217, "mean_norm/layer8": 9.68824589252472, "mean_norm/layer9": 9.646172046661377, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 5400 }, { "epoch": 2.25, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.45795662419942973, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.773238182067871, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8161, "eval_samples_per_second": 20.396, "eval_steps_per_second": 0.677, "step": 5400 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.28, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6707, "max_norm": 23.711584091186523, "max_norm/layer0": 18.696035385131836, "max_norm/layer1": 19.86383628845215, "max_norm/layer10": 21.319568634033203, "max_norm/layer11": 20.104448318481445, "max_norm/layer12": 21.343198776245117, "max_norm/layer13": 18.65641212463379, "max_norm/layer14": 20.11650848388672, "max_norm/layer15": 22.714111328125, "max_norm/layer16": 19.710603713989258, "max_norm/layer17": 22.677001953125, "max_norm/layer18": 20.324527740478516, "max_norm/layer19": 19.905961990356445, "max_norm/layer2": 16.444032669067383, "max_norm/layer20": 21.24724769592285, "max_norm/layer21": 20.659025192260742, "max_norm/layer22": 21.11807632446289, "max_norm/layer23": 20.669883728027344, "max_norm/layer3": 19.120800018310547, "max_norm/layer4": 19.565460205078125, "max_norm/layer5": 23.711584091186523, "max_norm/layer6": 17.779829025268555, "max_norm/layer7": 20.61775016784668, "max_norm/layer8": 21.11190414428711, "max_norm/layer9": 20.662193298339844, "mean_norm": 9.81824733565251, "mean_norm/layer0": 9.344789624214172, "mean_norm/layer1": 9.390469372272491, "mean_norm/layer10": 9.724392533302307, "mean_norm/layer11": 9.928160071372986, "mean_norm/layer12": 10.235535979270935, "mean_norm/layer13": 9.685753464698792, "mean_norm/layer14": 9.971448719501495, "mean_norm/layer15": 10.172397494316101, "mean_norm/layer16": 9.764802813529968, "mean_norm/layer17": 10.131413161754608, "mean_norm/layer18": 9.832902252674103, "mean_norm/layer19": 9.856505811214447, "mean_norm/layer2": 8.574154257774353, "mean_norm/layer20": 9.958525598049164, "mean_norm/layer21": 9.912037432193756, "mean_norm/layer22": 10.564294755458832, "mean_norm/layer23": 10.523465871810913, "mean_norm/layer3": 10.074239313602448, "mean_norm/layer4": 9.351719319820404, "mean_norm/layer5": 10.869217932224274, "mean_norm/layer6": 9.036074459552765, "mean_norm/layer7": 9.380382359027863, "mean_norm/layer8": 9.698756694793701, "mean_norm/layer9": 9.65649676322937, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 5450 }, { "epoch": 2.28, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4583906255703873, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.767972230911255, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5723, "eval_samples_per_second": 20.826, "eval_steps_per_second": 0.691, "step": 5450 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.3, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6828, "max_norm": 23.828529357910156, "max_norm/layer0": 18.77942657470703, "max_norm/layer1": 19.9698486328125, "max_norm/layer10": 21.414457321166992, "max_norm/layer11": 20.17760467529297, "max_norm/layer12": 21.42694854736328, "max_norm/layer13": 18.734359741210938, "max_norm/layer14": 20.196672439575195, "max_norm/layer15": 22.838233947753906, "max_norm/layer16": 19.811031341552734, "max_norm/layer17": 22.79621696472168, "max_norm/layer18": 20.419069290161133, "max_norm/layer19": 20.007299423217773, "max_norm/layer2": 16.4896183013916, "max_norm/layer20": 21.348735809326172, "max_norm/layer21": 20.764799118041992, "max_norm/layer22": 21.221994400024414, "max_norm/layer23": 20.771209716796875, "max_norm/layer3": 19.219717025756836, "max_norm/layer4": 19.63283348083496, "max_norm/layer5": 23.828529357910156, "max_norm/layer6": 17.82144546508789, "max_norm/layer7": 20.713653564453125, "max_norm/layer8": 21.195741653442383, "max_norm/layer9": 20.749263763427734, "mean_norm": 9.829934562246004, "mean_norm/layer0": 9.356457650661469, "mean_norm/layer1": 9.400355875492096, "mean_norm/layer10": 9.735199213027954, "mean_norm/layer11": 9.940261006355286, "mean_norm/layer12": 10.250323474407196, "mean_norm/layer13": 9.696837365627289, "mean_norm/layer14": 9.98394638299942, "mean_norm/layer15": 10.186484932899475, "mean_norm/layer16": 9.776153683662415, "mean_norm/layer17": 10.144715905189514, "mean_norm/layer18": 9.844414174556732, "mean_norm/layer19": 9.86827665567398, "mean_norm/layer2": 8.577622711658478, "mean_norm/layer20": 9.970131814479828, "mean_norm/layer21": 9.923815429210663, "mean_norm/layer22": 10.580283641815186, "mean_norm/layer23": 10.539456129074097, "mean_norm/layer3": 10.088192164897919, "mean_norm/layer4": 9.360041677951813, "mean_norm/layer5": 10.888111174106598, "mean_norm/layer6": 9.042340636253357, "mean_norm/layer7": 9.388883471488953, "mean_norm/layer8": 9.709352374076843, "mean_norm/layer9": 9.666771948337555, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 5500 }, { "epoch": 2.3, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.45791200723606024, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7675321102142334, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8324, "eval_samples_per_second": 20.368, "eval_steps_per_second": 0.676, "step": 5500 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.32, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.669, "max_norm": 23.937562942504883, "max_norm/layer0": 18.859041213989258, "max_norm/layer1": 20.078290939331055, "max_norm/layer10": 21.511146545410156, "max_norm/layer11": 20.23717498779297, "max_norm/layer12": 21.525150299072266, "max_norm/layer13": 18.80620765686035, "max_norm/layer14": 20.277151107788086, "max_norm/layer15": 22.951562881469727, "max_norm/layer16": 19.92555809020996, "max_norm/layer17": 22.931133270263672, "max_norm/layer18": 20.521669387817383, "max_norm/layer19": 20.11891746520996, "max_norm/layer2": 16.537145614624023, "max_norm/layer20": 21.444211959838867, "max_norm/layer21": 20.847387313842773, "max_norm/layer22": 21.34566879272461, "max_norm/layer23": 20.86615562438965, "max_norm/layer3": 19.326074600219727, "max_norm/layer4": 19.71425437927246, "max_norm/layer5": 23.937562942504883, "max_norm/layer6": 17.873159408569336, "max_norm/layer7": 20.806289672851562, "max_norm/layer8": 21.297988891601562, "max_norm/layer9": 20.845129013061523, "mean_norm": 9.841606857875982, "mean_norm/layer0": 9.368158996105194, "mean_norm/layer1": 9.410395383834839, "mean_norm/layer10": 9.74589717388153, "mean_norm/layer11": 9.952390968799591, "mean_norm/layer12": 10.265121459960938, "mean_norm/layer13": 9.707781314849854, "mean_norm/layer14": 9.996495127677917, "mean_norm/layer15": 10.20052945613861, "mean_norm/layer16": 9.78744912147522, "mean_norm/layer17": 10.157939553260803, "mean_norm/layer18": 9.85572999715805, "mean_norm/layer19": 9.879987061023712, "mean_norm/layer2": 8.581217646598816, "mean_norm/layer20": 9.981558501720428, "mean_norm/layer21": 9.935706377029419, "mean_norm/layer22": 10.596454083919525, "mean_norm/layer23": 10.555343270301819, "mean_norm/layer3": 10.10208147764206, "mean_norm/layer4": 9.36821448802948, "mean_norm/layer5": 10.906881392002106, "mean_norm/layer6": 9.04877257347107, "mean_norm/layer7": 9.397431671619415, "mean_norm/layer8": 9.720013678073883, "mean_norm/layer9": 9.67701381444931, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 5550 }, { "epoch": 2.32, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.45954255444283554, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7617156505584717, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8254, "eval_samples_per_second": 20.38, "eval_steps_per_second": 0.677, "step": 5550 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.34, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6786, "max_norm": 24.050399780273438, "max_norm/layer0": 18.92856788635254, "max_norm/layer1": 20.19409942626953, "max_norm/layer10": 21.61579704284668, "max_norm/layer11": 20.31001853942871, "max_norm/layer12": 21.62428092956543, "max_norm/layer13": 18.889577865600586, "max_norm/layer14": 20.359472274780273, "max_norm/layer15": 23.067659378051758, "max_norm/layer16": 20.03011131286621, "max_norm/layer17": 23.0419864654541, "max_norm/layer18": 20.61798667907715, "max_norm/layer19": 20.219560623168945, "max_norm/layer2": 16.568180084228516, "max_norm/layer20": 21.540401458740234, "max_norm/layer21": 20.965660095214844, "max_norm/layer22": 21.44856071472168, "max_norm/layer23": 20.963855743408203, "max_norm/layer3": 19.419219970703125, "max_norm/layer4": 19.802261352539062, "max_norm/layer5": 24.050399780273438, "max_norm/layer6": 17.924131393432617, "max_norm/layer7": 20.910070419311523, "max_norm/layer8": 21.38106918334961, "max_norm/layer9": 20.933855056762695, "mean_norm": 9.853289564450582, "mean_norm/layer0": 9.379805266857147, "mean_norm/layer1": 9.420386135578156, "mean_norm/layer10": 9.756702065467834, "mean_norm/layer11": 9.96448564529419, "mean_norm/layer12": 10.279956340789795, "mean_norm/layer13": 9.718806564807892, "mean_norm/layer14": 10.008846938610077, "mean_norm/layer15": 10.214514553546906, "mean_norm/layer16": 9.798823893070221, "mean_norm/layer17": 10.17122620344162, "mean_norm/layer18": 9.867085695266724, "mean_norm/layer19": 9.89163064956665, "mean_norm/layer2": 8.58489179611206, "mean_norm/layer20": 9.993090152740479, "mean_norm/layer21": 9.947735130786896, "mean_norm/layer22": 10.612680315971375, "mean_norm/layer23": 10.571164965629578, "mean_norm/layer3": 10.11597990989685, "mean_norm/layer4": 9.376480102539062, "mean_norm/layer5": 10.925587713718414, "mean_norm/layer6": 9.055172681808472, "mean_norm/layer7": 9.405917942523956, "mean_norm/layer8": 9.730691254138947, "mean_norm/layer9": 9.687287628650665, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 5600 }, { "epoch": 2.34, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.45928702092535584, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.764376401901245, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8216, "eval_samples_per_second": 20.386, "eval_steps_per_second": 0.677, "step": 5600 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.36, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6938, "max_norm": 24.169326782226562, "max_norm/layer0": 19.0015926361084, "max_norm/layer1": 20.306058883666992, "max_norm/layer10": 21.70053482055664, "max_norm/layer11": 20.392311096191406, "max_norm/layer12": 21.714736938476562, "max_norm/layer13": 18.960250854492188, "max_norm/layer14": 20.45236587524414, "max_norm/layer15": 23.201778411865234, "max_norm/layer16": 20.125362396240234, "max_norm/layer17": 23.156299591064453, "max_norm/layer18": 20.71641731262207, "max_norm/layer19": 20.32011604309082, "max_norm/layer2": 16.6474666595459, "max_norm/layer20": 21.623586654663086, "max_norm/layer21": 21.088895797729492, "max_norm/layer22": 21.558412551879883, "max_norm/layer23": 21.069276809692383, "max_norm/layer3": 19.493728637695312, "max_norm/layer4": 19.86513328552246, "max_norm/layer5": 24.169326782226562, "max_norm/layer6": 17.97091293334961, "max_norm/layer7": 21.01711654663086, "max_norm/layer8": 21.452049255371094, "max_norm/layer9": 21.005409240722656, "mean_norm": 9.864638393123945, "mean_norm/layer0": 9.3911452293396, "mean_norm/layer1": 9.430276334285736, "mean_norm/layer10": 9.767344295978546, "mean_norm/layer11": 9.976312398910522, "mean_norm/layer12": 10.294341802597046, "mean_norm/layer13": 9.729567348957062, "mean_norm/layer14": 10.02096837759018, "mean_norm/layer15": 10.228092610836029, "mean_norm/layer16": 9.809804558753967, "mean_norm/layer17": 10.18399292230606, "mean_norm/layer18": 9.878075778484344, "mean_norm/layer19": 9.902792990207672, "mean_norm/layer2": 8.58851420879364, "mean_norm/layer20": 10.004315316677094, "mean_norm/layer21": 9.95916599035263, "mean_norm/layer22": 10.628167688846588, "mean_norm/layer23": 10.586232781410217, "mean_norm/layer3": 10.129510223865509, "mean_norm/layer4": 9.384777843952179, "mean_norm/layer5": 10.943991243839264, "mean_norm/layer6": 9.061299085617065, "mean_norm/layer7": 9.414314091205597, "mean_norm/layer8": 9.741056561470032, "mean_norm/layer9": 9.69726175069809, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 5650 }, { "epoch": 2.36, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.45997655581379315, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.759434223175049, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5486, "eval_samples_per_second": 20.868, "eval_steps_per_second": 0.693, "step": 5650 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.38, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6634, "max_norm": 24.302297592163086, "max_norm/layer0": 19.074230194091797, "max_norm/layer1": 20.415058135986328, "max_norm/layer10": 21.800249099731445, "max_norm/layer11": 20.47414779663086, "max_norm/layer12": 21.825576782226562, "max_norm/layer13": 19.0487060546875, "max_norm/layer14": 20.540529251098633, "max_norm/layer15": 23.310043334960938, "max_norm/layer16": 20.21319007873535, "max_norm/layer17": 23.27543067932129, "max_norm/layer18": 20.82416534423828, "max_norm/layer19": 20.435667037963867, "max_norm/layer2": 16.726856231689453, "max_norm/layer20": 21.711185455322266, "max_norm/layer21": 21.18751335144043, "max_norm/layer22": 21.662084579467773, "max_norm/layer23": 21.18093490600586, "max_norm/layer3": 19.574790954589844, "max_norm/layer4": 19.932098388671875, "max_norm/layer5": 24.302297592163086, "max_norm/layer6": 18.029502868652344, "max_norm/layer7": 21.126331329345703, "max_norm/layer8": 21.547332763671875, "max_norm/layer9": 21.09630584716797, "mean_norm": 9.876142094532648, "mean_norm/layer0": 9.402709722518921, "mean_norm/layer1": 9.440324366092682, "mean_norm/layer10": 9.777914643287659, "mean_norm/layer11": 9.988339364528656, "mean_norm/layer12": 10.308962106704712, "mean_norm/layer13": 9.740558981895447, "mean_norm/layer14": 10.03328812122345, "mean_norm/layer15": 10.241935729980469, "mean_norm/layer16": 9.820912420749664, "mean_norm/layer17": 10.196899771690369, "mean_norm/layer18": 9.889229655265808, "mean_norm/layer19": 9.913987636566162, "mean_norm/layer2": 8.59205949306488, "mean_norm/layer20": 10.01566457748413, "mean_norm/layer21": 9.970516860485077, "mean_norm/layer22": 10.643815875053406, "mean_norm/layer23": 10.601855099201202, "mean_norm/layer3": 10.143052756786346, "mean_norm/layer4": 9.393064022064209, "mean_norm/layer5": 10.962677597999573, "mean_norm/layer6": 9.067675769329071, "mean_norm/layer7": 9.4227814078331, "mean_norm/layer8": 9.751694977283478, "mean_norm/layer9": 9.707489311695099, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 5700 }, { "epoch": 2.38, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4612258307881384, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.753422975540161, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8169, "eval_samples_per_second": 20.395, "eval_steps_per_second": 0.677, "step": 5700 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.4, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6744, "max_norm": 24.415847778320312, "max_norm/layer0": 19.146425247192383, "max_norm/layer1": 20.51773452758789, "max_norm/layer10": 21.890947341918945, "max_norm/layer11": 20.550748825073242, "max_norm/layer12": 21.946949005126953, "max_norm/layer13": 19.112741470336914, "max_norm/layer14": 20.610857009887695, "max_norm/layer15": 23.442441940307617, "max_norm/layer16": 20.31297492980957, "max_norm/layer17": 23.392274856567383, "max_norm/layer18": 20.90896987915039, "max_norm/layer19": 20.549793243408203, "max_norm/layer2": 16.79773712158203, "max_norm/layer20": 21.813404083251953, "max_norm/layer21": 21.293352127075195, "max_norm/layer22": 21.788415908813477, "max_norm/layer23": 21.271108627319336, "max_norm/layer3": 19.66872787475586, "max_norm/layer4": 19.997684478759766, "max_norm/layer5": 24.415847778320312, "max_norm/layer6": 18.082775115966797, "max_norm/layer7": 21.22279167175293, "max_norm/layer8": 21.611251831054688, "max_norm/layer9": 21.174211502075195, "mean_norm": 9.887629655500254, "mean_norm/layer0": 9.41416311264038, "mean_norm/layer1": 9.450378060340881, "mean_norm/layer10": 9.788468480110168, "mean_norm/layer11": 10.000294208526611, "mean_norm/layer12": 10.323612809181213, "mean_norm/layer13": 9.751441478729248, "mean_norm/layer14": 10.045649409294128, "mean_norm/layer15": 10.255648970603943, "mean_norm/layer16": 9.831993281841278, "mean_norm/layer17": 10.209833085536957, "mean_norm/layer18": 9.900463461875916, "mean_norm/layer19": 9.925138771533966, "mean_norm/layer2": 8.595655858516693, "mean_norm/layer20": 10.027330756187439, "mean_norm/layer21": 9.981902122497559, "mean_norm/layer22": 10.65961903333664, "mean_norm/layer23": 10.617213129997253, "mean_norm/layer3": 10.156732320785522, "mean_norm/layer4": 9.401276051998138, "mean_norm/layer5": 10.9812912940979, "mean_norm/layer6": 9.073957800865173, "mean_norm/layer7": 9.43110179901123, "mean_norm/layer8": 9.762260735034943, "mean_norm/layer9": 9.71768569946289, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 5750 }, { "epoch": 2.4, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46095812900792155, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7510087490081787, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6121, "eval_samples_per_second": 20.754, "eval_steps_per_second": 0.689, "step": 5750 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.42, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6799, "max_norm": 24.525354385375977, "max_norm/layer0": 19.21927833557129, "max_norm/layer1": 20.611085891723633, "max_norm/layer10": 21.969202041625977, "max_norm/layer11": 20.64573860168457, "max_norm/layer12": 22.06580352783203, "max_norm/layer13": 19.187246322631836, "max_norm/layer14": 20.70265007019043, "max_norm/layer15": 23.571685791015625, "max_norm/layer16": 20.39738655090332, "max_norm/layer17": 23.50619125366211, "max_norm/layer18": 20.994590759277344, "max_norm/layer19": 20.64227867126465, "max_norm/layer2": 16.8626651763916, "max_norm/layer20": 21.89752197265625, "max_norm/layer21": 21.396255493164062, "max_norm/layer22": 21.888132095336914, "max_norm/layer23": 21.377004623413086, "max_norm/layer3": 19.76741600036621, "max_norm/layer4": 20.093164443969727, "max_norm/layer5": 24.525354385375977, "max_norm/layer6": 18.127910614013672, "max_norm/layer7": 21.337644577026367, "max_norm/layer8": 21.689964294433594, "max_norm/layer9": 21.269315719604492, "mean_norm": 9.899055920541286, "mean_norm/layer0": 9.425514936447144, "mean_norm/layer1": 9.460303664207458, "mean_norm/layer10": 9.798951029777527, "mean_norm/layer11": 10.012129306793213, "mean_norm/layer12": 10.338140368461609, "mean_norm/layer13": 9.762259364128113, "mean_norm/layer14": 10.057992458343506, "mean_norm/layer15": 10.26939058303833, "mean_norm/layer16": 9.843165934085846, "mean_norm/layer17": 10.222750306129456, "mean_norm/layer18": 9.911642968654633, "mean_norm/layer19": 9.936326265335083, "mean_norm/layer2": 8.599254548549652, "mean_norm/layer20": 10.038680911064148, "mean_norm/layer21": 9.993187129497528, "mean_norm/layer22": 10.675156891345978, "mean_norm/layer23": 10.632552742958069, "mean_norm/layer3": 10.170215964317322, "mean_norm/layer4": 9.40942233800888, "mean_norm/layer5": 10.999845743179321, "mean_norm/layer6": 9.080201625823975, "mean_norm/layer7": 9.439405918121338, "mean_norm/layer8": 9.772936880588531, "mean_norm/layer9": 9.727914214134216, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 5800 }, { "epoch": 2.42, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4608202220302341, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7505526542663574, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7927, "eval_samples_per_second": 20.436, "eval_steps_per_second": 0.678, "step": 5800 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.44, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6799, "max_norm": 24.64824676513672, "max_norm/layer0": 19.30046844482422, "max_norm/layer1": 20.69877815246582, "max_norm/layer10": 22.053220748901367, "max_norm/layer11": 20.724355697631836, "max_norm/layer12": 22.196802139282227, "max_norm/layer13": 19.268417358398438, "max_norm/layer14": 20.79410171508789, "max_norm/layer15": 23.694843292236328, "max_norm/layer16": 20.494922637939453, "max_norm/layer17": 23.64689064025879, "max_norm/layer18": 21.078306198120117, "max_norm/layer19": 20.727556228637695, "max_norm/layer2": 16.929187774658203, "max_norm/layer20": 21.985841751098633, "max_norm/layer21": 21.498451232910156, "max_norm/layer22": 21.993858337402344, "max_norm/layer23": 21.484207153320312, "max_norm/layer3": 19.888816833496094, "max_norm/layer4": 20.171184539794922, "max_norm/layer5": 24.64824676513672, "max_norm/layer6": 18.182086944580078, "max_norm/layer7": 21.449859619140625, "max_norm/layer8": 21.770164489746094, "max_norm/layer9": 21.34680938720703, "mean_norm": 9.910489511986574, "mean_norm/layer0": 9.436944603919983, "mean_norm/layer1": 9.470270037651062, "mean_norm/layer10": 9.809482991695404, "mean_norm/layer11": 10.023900032043457, "mean_norm/layer12": 10.35284686088562, "mean_norm/layer13": 9.773071646690369, "mean_norm/layer14": 10.070310354232788, "mean_norm/layer15": 10.283128798007965, "mean_norm/layer16": 9.854249835014343, "mean_norm/layer17": 10.235677301883698, "mean_norm/layer18": 9.922667562961578, "mean_norm/layer19": 9.947410225868225, "mean_norm/layer2": 8.602798521518707, "mean_norm/layer20": 10.04989892244339, "mean_norm/layer21": 10.00466388463974, "mean_norm/layer22": 10.69081175327301, "mean_norm/layer23": 10.647965610027313, "mean_norm/layer3": 10.18393588066101, "mean_norm/layer4": 9.417515218257904, "mean_norm/layer5": 11.018384039402008, "mean_norm/layer6": 9.086404740810394, "mean_norm/layer7": 9.447878897190094, "mean_norm/layer8": 9.78347784280777, "mean_norm/layer9": 9.738052725791931, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 5850 }, { "epoch": 2.44, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4599846679889512, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.754044771194458, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8217, "eval_samples_per_second": 20.386, "eval_steps_per_second": 0.677, "step": 5850 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.46, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6767, "max_norm": 24.753965377807617, "max_norm/layer0": 19.378158569335938, "max_norm/layer1": 20.807764053344727, "max_norm/layer10": 22.12616539001465, "max_norm/layer11": 20.805105209350586, "max_norm/layer12": 22.287803649902344, "max_norm/layer13": 19.338436126708984, "max_norm/layer14": 20.869544982910156, "max_norm/layer15": 23.80994987487793, "max_norm/layer16": 20.60982894897461, "max_norm/layer17": 23.77663230895996, "max_norm/layer18": 21.178482055664062, "max_norm/layer19": 20.830650329589844, "max_norm/layer2": 16.985960006713867, "max_norm/layer20": 22.095294952392578, "max_norm/layer21": 21.586101531982422, "max_norm/layer22": 22.09933090209961, "max_norm/layer23": 21.59579849243164, "max_norm/layer3": 20.020875930786133, "max_norm/layer4": 20.229372024536133, "max_norm/layer5": 24.753965377807617, "max_norm/layer6": 18.241554260253906, "max_norm/layer7": 21.56122589111328, "max_norm/layer8": 21.847877502441406, "max_norm/layer9": 21.414751052856445, "mean_norm": 9.92179693778356, "mean_norm/layer0": 9.448293924331665, "mean_norm/layer1": 9.480082273483276, "mean_norm/layer10": 9.82001268863678, "mean_norm/layer11": 10.035534679889679, "mean_norm/layer12": 10.367335975170135, "mean_norm/layer13": 9.783747255802155, "mean_norm/layer14": 10.08247172832489, "mean_norm/layer15": 10.296784579753876, "mean_norm/layer16": 9.865318357944489, "mean_norm/layer17": 10.248357355594635, "mean_norm/layer18": 9.933477759361267, "mean_norm/layer19": 9.958428800106049, "mean_norm/layer2": 8.606263518333435, "mean_norm/layer20": 10.06111353635788, "mean_norm/layer21": 10.016002595424652, "mean_norm/layer22": 10.70626699924469, "mean_norm/layer23": 10.663025915622711, "mean_norm/layer3": 10.197382926940918, "mean_norm/layer4": 9.42559802532196, "mean_norm/layer5": 11.036820828914642, "mean_norm/layer6": 9.092549324035645, "mean_norm/layer7": 9.456212759017944, "mean_norm/layer8": 9.79387241601944, "mean_norm/layer9": 9.748172283172607, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 5900 }, { "epoch": 2.46, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4604754545860154, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.751302719116211, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5986, "eval_samples_per_second": 20.778, "eval_steps_per_second": 0.69, "step": 5900 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.48, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6723, "max_norm": 24.86185073852539, "max_norm/layer0": 19.464832305908203, "max_norm/layer1": 20.904747009277344, "max_norm/layer10": 22.21963882446289, "max_norm/layer11": 20.90224838256836, "max_norm/layer12": 22.370943069458008, "max_norm/layer13": 19.404891967773438, "max_norm/layer14": 20.9664249420166, "max_norm/layer15": 23.94396209716797, "max_norm/layer16": 20.73137664794922, "max_norm/layer17": 23.91629409790039, "max_norm/layer18": 21.258281707763672, "max_norm/layer19": 20.940629959106445, "max_norm/layer2": 17.0539493560791, "max_norm/layer20": 22.18185043334961, "max_norm/layer21": 21.683847427368164, "max_norm/layer22": 22.20035171508789, "max_norm/layer23": 21.70345115661621, "max_norm/layer3": 20.125995635986328, "max_norm/layer4": 20.29149055480957, "max_norm/layer5": 24.86185073852539, "max_norm/layer6": 18.295093536376953, "max_norm/layer7": 21.663230895996094, "max_norm/layer8": 21.92238426208496, "max_norm/layer9": 21.488218307495117, "mean_norm": 9.932985362907251, "mean_norm/layer0": 9.459501802921295, "mean_norm/layer1": 9.489829063415527, "mean_norm/layer10": 9.830254077911377, "mean_norm/layer11": 10.04719090461731, "mean_norm/layer12": 10.381703913211823, "mean_norm/layer13": 9.79422265291214, "mean_norm/layer14": 10.094463765621185, "mean_norm/layer15": 10.310104370117188, "mean_norm/layer16": 9.876312971115112, "mean_norm/layer17": 10.260833084583282, "mean_norm/layer18": 9.944314777851105, "mean_norm/layer19": 9.969380855560303, "mean_norm/layer2": 8.609793603420258, "mean_norm/layer20": 10.072267889976501, "mean_norm/layer21": 10.027061522006989, "mean_norm/layer22": 10.721749186515808, "mean_norm/layer23": 10.678084135055542, "mean_norm/layer3": 10.210697650909424, "mean_norm/layer4": 9.433561861515045, "mean_norm/layer5": 11.054940581321716, "mean_norm/layer6": 9.098546802997589, "mean_norm/layer7": 9.46446293592453, "mean_norm/layer8": 9.804116070270538, "mean_norm/layer9": 9.75825423002243, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 5950 }, { "epoch": 2.48, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46160304693298937, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.748650074005127, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 10.808, "eval_samples_per_second": 22.298, "eval_steps_per_second": 0.74, "step": 5950 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.51, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6815, "max_norm": 24.977638244628906, "max_norm/layer0": 19.546966552734375, "max_norm/layer1": 20.998462677001953, "max_norm/layer10": 22.314041137695312, "max_norm/layer11": 20.974071502685547, "max_norm/layer12": 22.48418617248535, "max_norm/layer13": 19.48900032043457, "max_norm/layer14": 21.050722122192383, "max_norm/layer15": 24.082304000854492, "max_norm/layer16": 20.837448120117188, "max_norm/layer17": 24.036243438720703, "max_norm/layer18": 21.340248107910156, "max_norm/layer19": 21.039228439331055, "max_norm/layer2": 17.137115478515625, "max_norm/layer20": 22.27361297607422, "max_norm/layer21": 21.761518478393555, "max_norm/layer22": 22.311800003051758, "max_norm/layer23": 21.796558380126953, "max_norm/layer3": 20.21436309814453, "max_norm/layer4": 20.353113174438477, "max_norm/layer5": 24.977638244628906, "max_norm/layer6": 18.35504150390625, "max_norm/layer7": 21.75100326538086, "max_norm/layer8": 22.014951705932617, "max_norm/layer9": 21.569259643554688, "mean_norm": 9.944234107931456, "mean_norm/layer0": 9.470636069774628, "mean_norm/layer1": 9.499629974365234, "mean_norm/layer10": 9.840614199638367, "mean_norm/layer11": 10.05879956483841, "mean_norm/layer12": 10.396033763885498, "mean_norm/layer13": 9.804863929748535, "mean_norm/layer14": 10.106550097465515, "mean_norm/layer15": 10.323493957519531, "mean_norm/layer16": 9.887224614620209, "mean_norm/layer17": 10.27337783575058, "mean_norm/layer18": 9.955014765262604, "mean_norm/layer19": 9.980344355106354, "mean_norm/layer2": 8.613344311714172, "mean_norm/layer20": 10.083471596240997, "mean_norm/layer21": 10.03798758983612, "mean_norm/layer22": 10.737454056739807, "mean_norm/layer23": 10.69325703382492, "mean_norm/layer3": 10.224131882190704, "mean_norm/layer4": 9.441782593727112, "mean_norm/layer5": 11.073285281658173, "mean_norm/layer6": 9.104702413082123, "mean_norm/layer7": 9.472704946994781, "mean_norm/layer8": 9.81453275680542, "mean_norm/layer9": 9.768380999565125, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 6000 }, { "epoch": 2.51, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4614570277801438, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.746541976928711, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8304, "eval_samples_per_second": 20.371, "eval_steps_per_second": 0.676, "step": 6000 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.53, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6786, "max_norm": 25.10230827331543, "max_norm/layer0": 19.610563278198242, "max_norm/layer1": 21.094833374023438, "max_norm/layer10": 22.392915725708008, "max_norm/layer11": 21.059268951416016, "max_norm/layer12": 22.60821533203125, "max_norm/layer13": 19.56475830078125, "max_norm/layer14": 21.15677833557129, "max_norm/layer15": 24.223785400390625, "max_norm/layer16": 20.94610595703125, "max_norm/layer17": 24.151611328125, "max_norm/layer18": 21.432071685791016, "max_norm/layer19": 21.153385162353516, "max_norm/layer2": 17.234243392944336, "max_norm/layer20": 22.37726593017578, "max_norm/layer21": 21.85563850402832, "max_norm/layer22": 22.410329818725586, "max_norm/layer23": 21.884920120239258, "max_norm/layer3": 20.298763275146484, "max_norm/layer4": 20.410865783691406, "max_norm/layer5": 25.10230827331543, "max_norm/layer6": 18.404077529907227, "max_norm/layer7": 21.845476150512695, "max_norm/layer8": 22.08577537536621, "max_norm/layer9": 21.64267349243164, "mean_norm": 9.955603557328383, "mean_norm/layer0": 9.481941640377045, "mean_norm/layer1": 9.509676814079285, "mean_norm/layer10": 9.851111769676208, "mean_norm/layer11": 10.070666432380676, "mean_norm/layer12": 10.410649418830872, "mean_norm/layer13": 9.815576553344727, "mean_norm/layer14": 10.118753135204315, "mean_norm/layer15": 10.337125837802887, "mean_norm/layer16": 9.898253440856934, "mean_norm/layer17": 10.28607988357544, "mean_norm/layer18": 9.965818166732788, "mean_norm/layer19": 9.991341471672058, "mean_norm/layer2": 8.616923332214355, "mean_norm/layer20": 10.094838857650757, "mean_norm/layer21": 10.049068450927734, "mean_norm/layer22": 10.753166139125824, "mean_norm/layer23": 10.708418011665344, "mean_norm/layer3": 10.237691342830658, "mean_norm/layer4": 9.450024247169495, "mean_norm/layer5": 11.09180212020874, "mean_norm/layer6": 9.110926032066345, "mean_norm/layer7": 9.481049478054047, "mean_norm/layer8": 9.825046956539154, "mean_norm/layer9": 9.778535842895508, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 6050 }, { "epoch": 2.53, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4603294354331699, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7469117641448975, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7837, "eval_samples_per_second": 20.452, "eval_steps_per_second": 0.679, "step": 6050 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.55, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6766, "max_norm": 25.228403091430664, "max_norm/layer0": 19.683305740356445, "max_norm/layer1": 21.202486038208008, "max_norm/layer10": 22.478837966918945, "max_norm/layer11": 21.12628173828125, "max_norm/layer12": 22.69508171081543, "max_norm/layer13": 19.65280532836914, "max_norm/layer14": 21.235212326049805, "max_norm/layer15": 24.364246368408203, "max_norm/layer16": 21.056020736694336, "max_norm/layer17": 24.269739151000977, "max_norm/layer18": 21.526058197021484, "max_norm/layer19": 21.24538230895996, "max_norm/layer2": 17.323163986206055, "max_norm/layer20": 22.47141456604004, "max_norm/layer21": 21.953645706176758, "max_norm/layer22": 22.524587631225586, "max_norm/layer23": 21.973390579223633, "max_norm/layer3": 20.381038665771484, "max_norm/layer4": 20.474964141845703, "max_norm/layer5": 25.228403091430664, "max_norm/layer6": 18.45362663269043, "max_norm/layer7": 21.947711944580078, "max_norm/layer8": 22.164188385009766, "max_norm/layer9": 21.733667373657227, "mean_norm": 9.966820580263933, "mean_norm/layer0": 9.493147373199463, "mean_norm/layer1": 9.51956021785736, "mean_norm/layer10": 9.861493289470673, "mean_norm/layer11": 10.082270801067352, "mean_norm/layer12": 10.42505133152008, "mean_norm/layer13": 9.8261559009552, "mean_norm/layer14": 10.130703926086426, "mean_norm/layer15": 10.350493848323822, "mean_norm/layer16": 9.909152209758759, "mean_norm/layer17": 10.298548698425293, "mean_norm/layer18": 9.976577043533325, "mean_norm/layer19": 10.002244293689728, "mean_norm/layer2": 8.620338201522827, "mean_norm/layer20": 10.106268465518951, "mean_norm/layer21": 10.06009829044342, "mean_norm/layer22": 10.768470168113708, "mean_norm/layer23": 10.723572373390198, "mean_norm/layer3": 10.250972270965576, "mean_norm/layer4": 9.458167791366577, "mean_norm/layer5": 11.110156893730164, "mean_norm/layer6": 9.117044448852539, "mean_norm/layer7": 9.489368438720703, "mean_norm/layer8": 9.835336029529572, "mean_norm/layer9": 9.788501620292664, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 6100 }, { "epoch": 2.55, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4611447090365575, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7434680461883545, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8476, "eval_samples_per_second": 20.342, "eval_steps_per_second": 0.675, "step": 6100 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.57, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6922, "max_norm": 25.344696044921875, "max_norm/layer0": 19.766042709350586, "max_norm/layer1": 21.28939437866211, "max_norm/layer10": 22.563648223876953, "max_norm/layer11": 21.195743560791016, "max_norm/layer12": 22.773914337158203, "max_norm/layer13": 19.732276916503906, "max_norm/layer14": 21.32152557373047, "max_norm/layer15": 24.493183135986328, "max_norm/layer16": 21.16498374938965, "max_norm/layer17": 24.38330841064453, "max_norm/layer18": 21.610130310058594, "max_norm/layer19": 21.38445281982422, "max_norm/layer2": 17.382400512695312, "max_norm/layer20": 22.576610565185547, "max_norm/layer21": 22.033180236816406, "max_norm/layer22": 22.632516860961914, "max_norm/layer23": 22.06123161315918, "max_norm/layer3": 20.473676681518555, "max_norm/layer4": 20.537517547607422, "max_norm/layer5": 25.344696044921875, "max_norm/layer6": 18.493179321289062, "max_norm/layer7": 22.041973114013672, "max_norm/layer8": 22.243497848510742, "max_norm/layer9": 21.801977157592773, "mean_norm": 9.97796812405189, "mean_norm/layer0": 9.504401445388794, "mean_norm/layer1": 9.529353737831116, "mean_norm/layer10": 9.871827602386475, "mean_norm/layer11": 10.093893706798553, "mean_norm/layer12": 10.439537703990936, "mean_norm/layer13": 9.83659952878952, "mean_norm/layer14": 10.142653703689575, "mean_norm/layer15": 10.363728702068329, "mean_norm/layer16": 9.919947028160095, "mean_norm/layer17": 10.310964286327362, "mean_norm/layer18": 9.987221598625183, "mean_norm/layer19": 10.013190269470215, "mean_norm/layer2": 8.623740553855896, "mean_norm/layer20": 10.117258369922638, "mean_norm/layer21": 10.071050822734833, "mean_norm/layer22": 10.78360378742218, "mean_norm/layer23": 10.73860216140747, "mean_norm/layer3": 10.264272034168243, "mean_norm/layer4": 9.466197848320007, "mean_norm/layer5": 11.12835305929184, "mean_norm/layer6": 9.123260974884033, "mean_norm/layer7": 9.497576415538788, "mean_norm/layer8": 9.845619022846222, "mean_norm/layer9": 9.798380613327026, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 6150 }, { "epoch": 2.57, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46083644638055027, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.742943286895752, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5803, "eval_samples_per_second": 20.811, "eval_steps_per_second": 0.691, "step": 6150 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.59, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6689, "max_norm": 25.47237777709961, "max_norm/layer0": 19.861135482788086, "max_norm/layer1": 21.369943618774414, "max_norm/layer10": 22.645503997802734, "max_norm/layer11": 21.277894973754883, "max_norm/layer12": 22.86878204345703, "max_norm/layer13": 19.81595802307129, "max_norm/layer14": 21.395647048950195, "max_norm/layer15": 24.607105255126953, "max_norm/layer16": 21.273733139038086, "max_norm/layer17": 24.506553649902344, "max_norm/layer18": 21.704404830932617, "max_norm/layer19": 21.492938995361328, "max_norm/layer2": 17.44423484802246, "max_norm/layer20": 22.680187225341797, "max_norm/layer21": 22.106203079223633, "max_norm/layer22": 22.743715286254883, "max_norm/layer23": 22.155893325805664, "max_norm/layer3": 20.574127197265625, "max_norm/layer4": 20.620710372924805, "max_norm/layer5": 25.47237777709961, "max_norm/layer6": 18.549198150634766, "max_norm/layer7": 22.10602569580078, "max_norm/layer8": 22.323543548583984, "max_norm/layer9": 21.855295181274414, "mean_norm": 9.988959466417631, "mean_norm/layer0": 9.515448808670044, "mean_norm/layer1": 9.53911018371582, "mean_norm/layer10": 9.881972074508667, "mean_norm/layer11": 10.105316400527954, "mean_norm/layer12": 10.45355623960495, "mean_norm/layer13": 9.846928358078003, "mean_norm/layer14": 10.154405415058136, "mean_norm/layer15": 10.376791179180145, "mean_norm/layer16": 9.930635511875153, "mean_norm/layer17": 10.323196768760681, "mean_norm/layer18": 9.997608542442322, "mean_norm/layer19": 10.023785591125488, "mean_norm/layer2": 8.627090692520142, "mean_norm/layer20": 10.128102242946625, "mean_norm/layer21": 10.081976056098938, "mean_norm/layer22": 10.798811733722687, "mean_norm/layer23": 10.753395140171051, "mean_norm/layer3": 10.277292788028717, "mean_norm/layer4": 9.473982751369476, "mean_norm/layer5": 11.146383464336395, "mean_norm/layer6": 9.129413843154907, "mean_norm/layer7": 9.505711376667023, "mean_norm/layer8": 9.855893790721893, "mean_norm/layer9": 9.808218240737915, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 6200 }, { "epoch": 2.59, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4616557760715169, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.739611864089966, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8022, "eval_samples_per_second": 20.42, "eval_steps_per_second": 0.678, "step": 6200 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.61, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6832, "max_norm": 25.609737396240234, "max_norm/layer0": 19.959583282470703, "max_norm/layer1": 21.443889617919922, "max_norm/layer10": 22.741214752197266, "max_norm/layer11": 21.409526824951172, "max_norm/layer12": 22.951099395751953, "max_norm/layer13": 19.897159576416016, "max_norm/layer14": 21.47847557067871, "max_norm/layer15": 24.755695343017578, "max_norm/layer16": 21.364933013916016, "max_norm/layer17": 24.639934539794922, "max_norm/layer18": 21.792865753173828, "max_norm/layer19": 21.58719825744629, "max_norm/layer2": 17.523984909057617, "max_norm/layer20": 22.785497665405273, "max_norm/layer21": 22.198741912841797, "max_norm/layer22": 22.869951248168945, "max_norm/layer23": 22.246004104614258, "max_norm/layer3": 20.67522430419922, "max_norm/layer4": 20.69664764404297, "max_norm/layer5": 25.609737396240234, "max_norm/layer6": 18.605470657348633, "max_norm/layer7": 22.189006805419922, "max_norm/layer8": 22.403486251831055, "max_norm/layer9": 21.930519104003906, "mean_norm": 9.9999838595589, "mean_norm/layer0": 9.526455461978912, "mean_norm/layer1": 9.548912286758423, "mean_norm/layer10": 9.892246067523956, "mean_norm/layer11": 10.116952002048492, "mean_norm/layer12": 10.467663824558258, "mean_norm/layer13": 9.857439279556274, "mean_norm/layer14": 10.166240513324738, "mean_norm/layer15": 10.390120685100555, "mean_norm/layer16": 9.941468596458435, "mean_norm/layer17": 10.335450530052185, "mean_norm/layer18": 10.008020222187042, "mean_norm/layer19": 10.034397423267365, "mean_norm/layer2": 8.630433797836304, "mean_norm/layer20": 10.139144003391266, "mean_norm/layer21": 10.092650175094604, "mean_norm/layer22": 10.813849329948425, "mean_norm/layer23": 10.767933666706085, "mean_norm/layer3": 10.290472090244293, "mean_norm/layer4": 9.481958389282227, "mean_norm/layer5": 11.164432644844055, "mean_norm/layer6": 9.135431170463562, "mean_norm/layer7": 9.513876497745514, "mean_norm/layer8": 9.866037726402283, "mean_norm/layer9": 9.81802624464035, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 6250 }, { "epoch": 2.61, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46189914132625953, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.735955238342285, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.9699, "eval_samples_per_second": 20.134, "eval_steps_per_second": 0.668, "step": 6250 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.63, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6732, "max_norm": 25.74430274963379, "max_norm/layer0": 20.05502700805664, "max_norm/layer1": 21.517070770263672, "max_norm/layer10": 22.837778091430664, "max_norm/layer11": 21.497528076171875, "max_norm/layer12": 23.044620513916016, "max_norm/layer13": 20.000743865966797, "max_norm/layer14": 21.55751609802246, "max_norm/layer15": 24.904428482055664, "max_norm/layer16": 21.46048355102539, "max_norm/layer17": 24.752845764160156, "max_norm/layer18": 21.87999725341797, "max_norm/layer19": 21.66996955871582, "max_norm/layer2": 17.590194702148438, "max_norm/layer20": 22.889404296875, "max_norm/layer21": 22.268436431884766, "max_norm/layer22": 22.98247718811035, "max_norm/layer23": 22.344642639160156, "max_norm/layer3": 20.77219009399414, "max_norm/layer4": 20.779855728149414, "max_norm/layer5": 25.74430274963379, "max_norm/layer6": 18.65287208557129, "max_norm/layer7": 22.270421981811523, "max_norm/layer8": 22.518630981445312, "max_norm/layer9": 22.00423812866211, "mean_norm": 10.011001144846281, "mean_norm/layer0": 9.537546277046204, "mean_norm/layer1": 9.558590412139893, "mean_norm/layer10": 9.902466833591461, "mean_norm/layer11": 10.128420174121857, "mean_norm/layer12": 10.481824576854706, "mean_norm/layer13": 9.867795050144196, "mean_norm/layer14": 10.178068697452545, "mean_norm/layer15": 10.403307795524597, "mean_norm/layer16": 9.952224373817444, "mean_norm/layer17": 10.34775185585022, "mean_norm/layer18": 10.018373608589172, "mean_norm/layer19": 10.04506230354309, "mean_norm/layer2": 8.633818507194519, "mean_norm/layer20": 10.15004014968872, "mean_norm/layer21": 10.103437781333923, "mean_norm/layer22": 10.828993797302246, "mean_norm/layer23": 10.78253710269928, "mean_norm/layer3": 10.30362993478775, "mean_norm/layer4": 9.489933848381042, "mean_norm/layer5": 11.182459115982056, "mean_norm/layer6": 9.141457200050354, "mean_norm/layer7": 9.522015750408173, "mean_norm/layer8": 9.876333832740784, "mean_norm/layer9": 9.827938497066498, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 6300 }, { "epoch": 2.63, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46196809481510326, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.738924503326416, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.9635, "eval_samples_per_second": 20.145, "eval_steps_per_second": 0.669, "step": 6300 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.65, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6893, "max_norm": 25.860660552978516, "max_norm/layer0": 20.153108596801758, "max_norm/layer1": 21.598623275756836, "max_norm/layer10": 22.939794540405273, "max_norm/layer11": 21.61341094970703, "max_norm/layer12": 23.165863037109375, "max_norm/layer13": 20.091089248657227, "max_norm/layer14": 21.64145278930664, "max_norm/layer15": 25.02685546875, "max_norm/layer16": 21.53008460998535, "max_norm/layer17": 24.88070297241211, "max_norm/layer18": 21.985137939453125, "max_norm/layer19": 21.748992919921875, "max_norm/layer2": 17.670303344726562, "max_norm/layer20": 22.993227005004883, "max_norm/layer21": 22.341312408447266, "max_norm/layer22": 23.091922760009766, "max_norm/layer23": 22.425304412841797, "max_norm/layer3": 20.88212776184082, "max_norm/layer4": 20.852691650390625, "max_norm/layer5": 25.860660552978516, "max_norm/layer6": 18.694791793823242, "max_norm/layer7": 22.36998748779297, "max_norm/layer8": 22.611835479736328, "max_norm/layer9": 22.073123931884766, "mean_norm": 10.021994044383367, "mean_norm/layer0": 9.548484921455383, "mean_norm/layer1": 9.568365037441254, "mean_norm/layer10": 9.912571847438812, "mean_norm/layer11": 10.139825105667114, "mean_norm/layer12": 10.495871722698212, "mean_norm/layer13": 9.878227055072784, "mean_norm/layer14": 10.189821481704712, "mean_norm/layer15": 10.416566729545593, "mean_norm/layer16": 9.962967872619629, "mean_norm/layer17": 10.359967112541199, "mean_norm/layer18": 10.028738617897034, "mean_norm/layer19": 10.05587649345398, "mean_norm/layer2": 8.637226641178131, "mean_norm/layer20": 10.160935282707214, "mean_norm/layer21": 10.114270150661469, "mean_norm/layer22": 10.844156503677368, "mean_norm/layer23": 10.797121524810791, "mean_norm/layer3": 10.316659390926361, "mean_norm/layer4": 9.497858464717865, "mean_norm/layer5": 11.200486063957214, "mean_norm/layer6": 9.147541284561157, "mean_norm/layer7": 9.530200600624084, "mean_norm/layer8": 9.886442244052887, "mean_norm/layer9": 9.837674915790558, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 6350 }, { "epoch": 2.65, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4616557760715169, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.738407850265503, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.894, "eval_samples_per_second": 20.262, "eval_steps_per_second": 0.673, "step": 6350 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.67, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6801, "max_norm": 25.973201751708984, "max_norm/layer0": 20.24967384338379, "max_norm/layer1": 21.692955017089844, "max_norm/layer10": 23.032072067260742, "max_norm/layer11": 21.712499618530273, "max_norm/layer12": 23.234333038330078, "max_norm/layer13": 20.183149337768555, "max_norm/layer14": 21.744234085083008, "max_norm/layer15": 25.175216674804688, "max_norm/layer16": 21.600980758666992, "max_norm/layer17": 25.01777458190918, "max_norm/layer18": 22.099838256835938, "max_norm/layer19": 21.83799171447754, "max_norm/layer2": 17.750036239624023, "max_norm/layer20": 23.09636688232422, "max_norm/layer21": 22.446022033691406, "max_norm/layer22": 23.194242477416992, "max_norm/layer23": 22.509754180908203, "max_norm/layer3": 20.972686767578125, "max_norm/layer4": 20.944406509399414, "max_norm/layer5": 25.973201751708984, "max_norm/layer6": 18.7388858795166, "max_norm/layer7": 22.43354606628418, "max_norm/layer8": 22.72319221496582, "max_norm/layer9": 22.152870178222656, "mean_norm": 10.033037247757116, "mean_norm/layer0": 9.559500932693481, "mean_norm/layer1": 9.57817429304123, "mean_norm/layer10": 9.92283582687378, "mean_norm/layer11": 10.151250958442688, "mean_norm/layer12": 10.510083556175232, "mean_norm/layer13": 9.888749897480011, "mean_norm/layer14": 10.201764583587646, "mean_norm/layer15": 10.429744482040405, "mean_norm/layer16": 9.973683893680573, "mean_norm/layer17": 10.372322142124176, "mean_norm/layer18": 10.039182603359222, "mean_norm/layer19": 10.066715955734253, "mean_norm/layer2": 8.640654444694519, "mean_norm/layer20": 10.171599209308624, "mean_norm/layer21": 10.125025808811188, "mean_norm/layer22": 10.859051883220673, "mean_norm/layer23": 10.811841130256653, "mean_norm/layer3": 10.329941034317017, "mean_norm/layer4": 9.505902767181396, "mean_norm/layer5": 11.218784868717194, "mean_norm/layer6": 9.153590142726898, "mean_norm/layer7": 9.538390636444092, "mean_norm/layer8": 9.896606981754303, "mean_norm/layer9": 9.847495913505554, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 6400 }, { "epoch": 2.67, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.462511610550695, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.732863664627075, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8118, "eval_samples_per_second": 20.403, "eval_steps_per_second": 0.677, "step": 6400 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.69, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6817, "max_norm": 26.08163070678711, "max_norm/layer0": 20.342599868774414, "max_norm/layer1": 21.786935806274414, "max_norm/layer10": 23.1118106842041, "max_norm/layer11": 21.78784942626953, "max_norm/layer12": 23.314739227294922, "max_norm/layer13": 20.244739532470703, "max_norm/layer14": 21.830318450927734, "max_norm/layer15": 25.3209228515625, "max_norm/layer16": 21.691482543945312, "max_norm/layer17": 25.14759063720703, "max_norm/layer18": 22.2069034576416, "max_norm/layer19": 21.922334671020508, "max_norm/layer2": 17.808311462402344, "max_norm/layer20": 23.185317993164062, "max_norm/layer21": 22.515777587890625, "max_norm/layer22": 23.288124084472656, "max_norm/layer23": 22.597469329833984, "max_norm/layer3": 21.05324363708496, "max_norm/layer4": 21.01177215576172, "max_norm/layer5": 26.08163070678711, "max_norm/layer6": 18.78575325012207, "max_norm/layer7": 22.506237030029297, "max_norm/layer8": 22.81680679321289, "max_norm/layer9": 22.22559928894043, "mean_norm": 10.043887262543043, "mean_norm/layer0": 9.570309102535248, "mean_norm/layer1": 9.587825655937195, "mean_norm/layer10": 9.932947993278503, "mean_norm/layer11": 10.162622213363647, "mean_norm/layer12": 10.524069786071777, "mean_norm/layer13": 9.899032413959503, "mean_norm/layer14": 10.213397681713104, "mean_norm/layer15": 10.44272756576538, "mean_norm/layer16": 9.984095215797424, "mean_norm/layer17": 10.38427847623825, "mean_norm/layer18": 10.049458801746368, "mean_norm/layer19": 10.07730907201767, "mean_norm/layer2": 8.64402985572815, "mean_norm/layer20": 10.182213187217712, "mean_norm/layer21": 10.135670959949493, "mean_norm/layer22": 10.873790740966797, "mean_norm/layer23": 10.826238214969635, "mean_norm/layer3": 10.342928886413574, "mean_norm/layer4": 9.513796925544739, "mean_norm/layer5": 11.236631333827972, "mean_norm/layer6": 9.159627318382263, "mean_norm/layer7": 9.546464681625366, "mean_norm/layer8": 9.906689047813416, "mean_norm/layer9": 9.85713917016983, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 6450 }, { "epoch": 2.69, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4634282863435587, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7291603088378906, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 10.9312, "eval_samples_per_second": 22.047, "eval_steps_per_second": 0.732, "step": 6450 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.71, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6874, "max_norm": 26.185462951660156, "max_norm/layer0": 20.429880142211914, "max_norm/layer1": 21.891557693481445, "max_norm/layer10": 23.196739196777344, "max_norm/layer11": 21.859304428100586, "max_norm/layer12": 23.41972541809082, "max_norm/layer13": 20.317655563354492, "max_norm/layer14": 21.93121337890625, "max_norm/layer15": 25.443115234375, "max_norm/layer16": 21.796695709228516, "max_norm/layer17": 25.274187088012695, "max_norm/layer18": 22.326488494873047, "max_norm/layer19": 22.01841163635254, "max_norm/layer2": 17.86547088623047, "max_norm/layer20": 23.280214309692383, "max_norm/layer21": 22.618255615234375, "max_norm/layer22": 23.38398551940918, "max_norm/layer23": 22.68142318725586, "max_norm/layer3": 21.130823135375977, "max_norm/layer4": 21.080659866333008, "max_norm/layer5": 26.185462951660156, "max_norm/layer6": 18.8240909576416, "max_norm/layer7": 22.595474243164062, "max_norm/layer8": 22.909751892089844, "max_norm/layer9": 22.31151008605957, "mean_norm": 10.054706205924353, "mean_norm/layer0": 9.581124305725098, "mean_norm/layer1": 9.597380995750427, "mean_norm/layer10": 9.9429412484169, "mean_norm/layer11": 10.173977673053741, "mean_norm/layer12": 10.537902593612671, "mean_norm/layer13": 9.909233927726746, "mean_norm/layer14": 10.225030422210693, "mean_norm/layer15": 10.455805003643036, "mean_norm/layer16": 9.994404911994934, "mean_norm/layer17": 10.396243751049042, "mean_norm/layer18": 10.059688329696655, "mean_norm/layer19": 10.08789175748825, "mean_norm/layer2": 8.647391676902771, "mean_norm/layer20": 10.192969799041748, "mean_norm/layer21": 10.14613652229309, "mean_norm/layer22": 10.88859474658966, "mean_norm/layer23": 10.8405082821846, "mean_norm/layer3": 10.355776727199554, "mean_norm/layer4": 9.52163827419281, "mean_norm/layer5": 11.25450748205185, "mean_norm/layer6": 9.165621161460876, "mean_norm/layer7": 9.554507315158844, "mean_norm/layer8": 9.916891932487488, "mean_norm/layer9": 9.86678010225296, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 6500 }, { "epoch": 2.71, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4635580811460881, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.728681802749634, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.9589, "eval_samples_per_second": 20.152, "eval_steps_per_second": 0.669, "step": 6500 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.73, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.679, "max_norm": 26.300392150878906, "max_norm/layer0": 20.514989852905273, "max_norm/layer1": 21.97933006286621, "max_norm/layer10": 23.27261734008789, "max_norm/layer11": 21.926321029663086, "max_norm/layer12": 23.4990291595459, "max_norm/layer13": 20.39130210876465, "max_norm/layer14": 22.02625274658203, "max_norm/layer15": 25.556787490844727, "max_norm/layer16": 21.871458053588867, "max_norm/layer17": 25.401857376098633, "max_norm/layer18": 22.435489654541016, "max_norm/layer19": 22.1010684967041, "max_norm/layer2": 17.91828727722168, "max_norm/layer20": 23.372716903686523, "max_norm/layer21": 22.709657669067383, "max_norm/layer22": 23.478649139404297, "max_norm/layer23": 22.77086067199707, "max_norm/layer3": 21.2097110748291, "max_norm/layer4": 21.154205322265625, "max_norm/layer5": 26.300392150878906, "max_norm/layer6": 18.872074127197266, "max_norm/layer7": 22.68345832824707, "max_norm/layer8": 23.019010543823242, "max_norm/layer9": 22.39520263671875, "mean_norm": 10.065300052364668, "mean_norm/layer0": 9.591688811779022, "mean_norm/layer1": 9.60675710439682, "mean_norm/layer10": 9.95275890827179, "mean_norm/layer11": 10.185077250003815, "mean_norm/layer12": 10.55156809091568, "mean_norm/layer13": 9.919322490692139, "mean_norm/layer14": 10.236485064029694, "mean_norm/layer15": 10.468361973762512, "mean_norm/layer16": 10.004529654979706, "mean_norm/layer17": 10.407990336418152, "mean_norm/layer18": 10.069653689861298, "mean_norm/layer19": 10.098095178604126, "mean_norm/layer2": 8.650662422180176, "mean_norm/layer20": 10.203266143798828, "mean_norm/layer21": 10.156417906284332, "mean_norm/layer22": 10.903109967708588, "mean_norm/layer23": 10.854621052742004, "mean_norm/layer3": 10.368398368358612, "mean_norm/layer4": 9.529488384723663, "mean_norm/layer5": 11.272061467170715, "mean_norm/layer6": 9.17146784067154, "mean_norm/layer7": 9.562333583831787, "mean_norm/layer8": 9.926826179027557, "mean_norm/layer9": 9.87625938653946, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 6550 }, { "epoch": 2.73, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46354591288335095, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7235679626464844, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.9943, "eval_samples_per_second": 20.093, "eval_steps_per_second": 0.667, "step": 6550 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.76, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6811, "max_norm": 26.41242790222168, "max_norm/layer0": 20.60313606262207, "max_norm/layer1": 22.07373046875, "max_norm/layer10": 23.349884033203125, "max_norm/layer11": 21.98993682861328, "max_norm/layer12": 23.584455490112305, "max_norm/layer13": 20.48732566833496, "max_norm/layer14": 22.116924285888672, "max_norm/layer15": 25.71857261657715, "max_norm/layer16": 21.94927978515625, "max_norm/layer17": 25.516101837158203, "max_norm/layer18": 22.543033599853516, "max_norm/layer19": 22.182836532592773, "max_norm/layer2": 17.969606399536133, "max_norm/layer20": 23.472898483276367, "max_norm/layer21": 22.797204971313477, "max_norm/layer22": 23.56959342956543, "max_norm/layer23": 22.859933853149414, "max_norm/layer3": 21.289579391479492, "max_norm/layer4": 21.220144271850586, "max_norm/layer5": 26.41242790222168, "max_norm/layer6": 18.920167922973633, "max_norm/layer7": 22.76586151123047, "max_norm/layer8": 23.115718841552734, "max_norm/layer9": 22.4892635345459, "mean_norm": 10.076057064036528, "mean_norm/layer0": 9.602395057678223, "mean_norm/layer1": 9.616295576095581, "mean_norm/layer10": 9.962799191474915, "mean_norm/layer11": 10.196372210979462, "mean_norm/layer12": 10.565538883209229, "mean_norm/layer13": 9.929556131362915, "mean_norm/layer14": 10.248076438903809, "mean_norm/layer15": 10.481202960014343, "mean_norm/layer16": 10.014976143836975, "mean_norm/layer17": 10.419837892055511, "mean_norm/layer18": 10.079734206199646, "mean_norm/layer19": 10.108431100845337, "mean_norm/layer2": 8.654021739959717, "mean_norm/layer20": 10.213871002197266, "mean_norm/layer21": 10.167028248310089, "mean_norm/layer22": 10.917715430259705, "mean_norm/layer23": 10.86873722076416, "mean_norm/layer3": 10.381210148334503, "mean_norm/layer4": 9.537363827228546, "mean_norm/layer5": 11.289835691452026, "mean_norm/layer6": 9.177374601364136, "mean_norm/layer7": 9.570362865924835, "mean_norm/layer8": 9.93681263923645, "mean_norm/layer9": 9.8858203291893, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 6600 }, { "epoch": 2.76, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4633228280665036, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7256357669830322, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 10.9601, "eval_samples_per_second": 21.989, "eval_steps_per_second": 0.73, "step": 6600 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.78, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6643, "max_norm": 26.53062629699707, "max_norm/layer0": 20.69165802001953, "max_norm/layer1": 22.169431686401367, "max_norm/layer10": 23.433088302612305, "max_norm/layer11": 22.052358627319336, "max_norm/layer12": 23.695178985595703, "max_norm/layer13": 20.58042335510254, "max_norm/layer14": 22.196151733398438, "max_norm/layer15": 25.866147994995117, "max_norm/layer16": 22.042850494384766, "max_norm/layer17": 25.626388549804688, "max_norm/layer18": 22.655969619750977, "max_norm/layer19": 22.26487159729004, "max_norm/layer2": 18.044330596923828, "max_norm/layer20": 23.553281784057617, "max_norm/layer21": 22.87949562072754, "max_norm/layer22": 23.65622901916504, "max_norm/layer23": 22.95343589782715, "max_norm/layer3": 21.365331649780273, "max_norm/layer4": 21.279878616333008, "max_norm/layer5": 26.53062629699707, "max_norm/layer6": 18.96720314025879, "max_norm/layer7": 22.85620880126953, "max_norm/layer8": 23.207963943481445, "max_norm/layer9": 22.580841064453125, "mean_norm": 10.086789600551128, "mean_norm/layer0": 9.613000214099884, "mean_norm/layer1": 9.625762045383453, "mean_norm/layer10": 9.97273999452591, "mean_norm/layer11": 10.207618951797485, "mean_norm/layer12": 10.579367339611053, "mean_norm/layer13": 9.939832985401154, "mean_norm/layer14": 10.259712278842926, "mean_norm/layer15": 10.494081377983093, "mean_norm/layer16": 10.025314569473267, "mean_norm/layer17": 10.431630611419678, "mean_norm/layer18": 10.089784562587738, "mean_norm/layer19": 10.11875718832016, "mean_norm/layer2": 8.65731281042099, "mean_norm/layer20": 10.224305629730225, "mean_norm/layer21": 10.177746534347534, "mean_norm/layer22": 10.93244206905365, "mean_norm/layer23": 10.883185744285583, "mean_norm/layer3": 10.393769443035126, "mean_norm/layer4": 9.54505968093872, "mean_norm/layer5": 11.307492792606354, "mean_norm/layer6": 9.183353424072266, "mean_norm/layer7": 9.578372538089752, "mean_norm/layer8": 9.946847558021545, "mean_norm/layer9": 9.895460069179535, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 6650 }, { "epoch": 2.78, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.464113765144417, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7235653400421143, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 10.9913, "eval_samples_per_second": 21.927, "eval_steps_per_second": 0.728, "step": 6650 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.8, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6876, "max_norm": 26.64914894104004, "max_norm/layer0": 20.784852981567383, "max_norm/layer1": 22.261592864990234, "max_norm/layer10": 23.51398277282715, "max_norm/layer11": 22.147192001342773, "max_norm/layer12": 23.818450927734375, "max_norm/layer13": 20.655099868774414, "max_norm/layer14": 22.267887115478516, "max_norm/layer15": 25.970462799072266, "max_norm/layer16": 22.135021209716797, "max_norm/layer17": 25.742647171020508, "max_norm/layer18": 22.75875473022461, "max_norm/layer19": 22.36121368408203, "max_norm/layer2": 18.096092224121094, "max_norm/layer20": 23.627822875976562, "max_norm/layer21": 22.97427749633789, "max_norm/layer22": 23.749114990234375, "max_norm/layer23": 23.046504974365234, "max_norm/layer3": 21.45503044128418, "max_norm/layer4": 21.35271453857422, "max_norm/layer5": 26.64914894104004, "max_norm/layer6": 19.017742156982422, "max_norm/layer7": 22.955495834350586, "max_norm/layer8": 23.273195266723633, "max_norm/layer9": 22.669376373291016, "mean_norm": 10.09744872401158, "mean_norm/layer0": 9.623487830162048, "mean_norm/layer1": 9.635239779949188, "mean_norm/layer10": 9.982640266418457, "mean_norm/layer11": 10.218821167945862, "mean_norm/layer12": 10.593107223510742, "mean_norm/layer13": 9.950129866600037, "mean_norm/layer14": 10.271190285682678, "mean_norm/layer15": 10.50691831111908, "mean_norm/layer16": 10.035589933395386, "mean_norm/layer17": 10.443416774272919, "mean_norm/layer18": 10.099798321723938, "mean_norm/layer19": 10.12911069393158, "mean_norm/layer2": 8.660598039627075, "mean_norm/layer20": 10.234609246253967, "mean_norm/layer21": 10.188297629356384, "mean_norm/layer22": 10.946758568286896, "mean_norm/layer23": 10.897278547286987, "mean_norm/layer3": 10.406484246253967, "mean_norm/layer4": 9.55282211303711, "mean_norm/layer5": 11.324999570846558, "mean_norm/layer6": 9.18930995464325, "mean_norm/layer7": 9.58632493019104, "mean_norm/layer8": 9.956737279891968, "mean_norm/layer9": 9.905098795890808, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 6700 }, { "epoch": 2.8, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4638582316269373, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7227768898010254, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.9561, "eval_samples_per_second": 20.157, "eval_steps_per_second": 0.669, "step": 6700 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.82, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6642, "max_norm": 26.773120880126953, "max_norm/layer0": 20.875125885009766, "max_norm/layer1": 22.349252700805664, "max_norm/layer10": 23.591472625732422, "max_norm/layer11": 22.24338150024414, "max_norm/layer12": 23.943801879882812, "max_norm/layer13": 20.728654861450195, "max_norm/layer14": 22.363893508911133, "max_norm/layer15": 26.09659194946289, "max_norm/layer16": 22.210033416748047, "max_norm/layer17": 25.849321365356445, "max_norm/layer18": 22.857954025268555, "max_norm/layer19": 22.457433700561523, "max_norm/layer2": 18.137813568115234, "max_norm/layer20": 23.715415954589844, "max_norm/layer21": 23.066875457763672, "max_norm/layer22": 23.838668823242188, "max_norm/layer23": 23.13340950012207, "max_norm/layer3": 21.559398651123047, "max_norm/layer4": 21.422008514404297, "max_norm/layer5": 26.773120880126953, "max_norm/layer6": 19.059314727783203, "max_norm/layer7": 23.055139541625977, "max_norm/layer8": 23.34084701538086, "max_norm/layer9": 22.744380950927734, "mean_norm": 10.108140423893929, "mean_norm/layer0": 9.634041845798492, "mean_norm/layer1": 9.64472496509552, "mean_norm/layer10": 9.992616534233093, "mean_norm/layer11": 10.230005323886871, "mean_norm/layer12": 10.606897294521332, "mean_norm/layer13": 9.960363149642944, "mean_norm/layer14": 10.282639801502228, "mean_norm/layer15": 10.519710779190063, "mean_norm/layer16": 10.045837819576263, "mean_norm/layer17": 10.455260336399078, "mean_norm/layer18": 10.109922409057617, "mean_norm/layer19": 10.13957166671753, "mean_norm/layer2": 8.663931012153625, "mean_norm/layer20": 10.244955360889435, "mean_norm/layer21": 10.198612809181213, "mean_norm/layer22": 10.961101591587067, "mean_norm/layer23": 10.911440670490265, "mean_norm/layer3": 10.419304966926575, "mean_norm/layer4": 9.560689806938171, "mean_norm/layer5": 11.342604517936707, "mean_norm/layer6": 9.19537079334259, "mean_norm/layer7": 9.594294905662537, "mean_norm/layer8": 9.96668291091919, "mean_norm/layer9": 9.914788901805878, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 6750 }, { "epoch": 2.82, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46477896350738007, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.719167470932007, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.9754, "eval_samples_per_second": 20.125, "eval_steps_per_second": 0.668, "step": 6750 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.84, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6727, "max_norm": 26.90037727355957, "max_norm/layer0": 20.969045639038086, "max_norm/layer1": 22.430818557739258, "max_norm/layer10": 23.685087203979492, "max_norm/layer11": 22.313629150390625, "max_norm/layer12": 24.071069717407227, "max_norm/layer13": 20.809654235839844, "max_norm/layer14": 22.459442138671875, "max_norm/layer15": 26.201696395874023, "max_norm/layer16": 22.303298950195312, "max_norm/layer17": 25.975738525390625, "max_norm/layer18": 22.961307525634766, "max_norm/layer19": 22.554285049438477, "max_norm/layer2": 18.194622039794922, "max_norm/layer20": 23.812129974365234, "max_norm/layer21": 23.155019760131836, "max_norm/layer22": 23.927391052246094, "max_norm/layer23": 23.213560104370117, "max_norm/layer3": 21.650287628173828, "max_norm/layer4": 21.503629684448242, "max_norm/layer5": 26.90037727355957, "max_norm/layer6": 19.09876251220703, "max_norm/layer7": 23.141084671020508, "max_norm/layer8": 23.412324905395508, "max_norm/layer9": 22.814966201782227, "mean_norm": 10.118629676600298, "mean_norm/layer0": 9.644381642341614, "mean_norm/layer1": 9.654210925102234, "mean_norm/layer10": 10.002406060695648, "mean_norm/layer11": 10.240853428840637, "mean_norm/layer12": 10.620422959327698, "mean_norm/layer13": 9.970386505126953, "mean_norm/layer14": 10.293885469436646, "mean_norm/layer15": 10.53236836194992, "mean_norm/layer16": 10.055989801883698, "mean_norm/layer17": 10.4669588804245, "mean_norm/layer18": 10.119860827922821, "mean_norm/layer19": 10.14971262216568, "mean_norm/layer2": 8.667130768299103, "mean_norm/layer20": 10.255202949047089, "mean_norm/layer21": 10.208835124969482, "mean_norm/layer22": 10.975344359874725, "mean_norm/layer23": 10.925430059432983, "mean_norm/layer3": 10.431658208370209, "mean_norm/layer4": 9.568336188793182, "mean_norm/layer5": 11.35985416173935, "mean_norm/layer6": 9.201176106929779, "mean_norm/layer7": 9.60221016407013, "mean_norm/layer8": 9.976355135440826, "mean_norm/layer9": 9.924141526222229, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 6800 }, { "epoch": 2.84, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46521296487833763, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7178404331207275, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 12.0017, "eval_samples_per_second": 20.08, "eval_steps_per_second": 0.667, "step": 6800 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.86, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6807, "max_norm": 27.022308349609375, "max_norm/layer0": 21.06038475036621, "max_norm/layer1": 22.520341873168945, "max_norm/layer10": 23.770435333251953, "max_norm/layer11": 22.414648056030273, "max_norm/layer12": 24.182048797607422, "max_norm/layer13": 20.879291534423828, "max_norm/layer14": 22.538923263549805, "max_norm/layer15": 26.301652908325195, "max_norm/layer16": 22.408843994140625, "max_norm/layer17": 26.084640502929688, "max_norm/layer18": 23.061779022216797, "max_norm/layer19": 22.65226936340332, "max_norm/layer2": 18.260866165161133, "max_norm/layer20": 23.915470123291016, "max_norm/layer21": 23.253692626953125, "max_norm/layer22": 24.023237228393555, "max_norm/layer23": 23.293275833129883, "max_norm/layer3": 21.75033187866211, "max_norm/layer4": 21.58634376525879, "max_norm/layer5": 27.022308349609375, "max_norm/layer6": 19.1436824798584, "max_norm/layer7": 23.238664627075195, "max_norm/layer8": 23.49786949157715, "max_norm/layer9": 22.880979537963867, "mean_norm": 10.129067420959473, "mean_norm/layer0": 9.65470838546753, "mean_norm/layer1": 9.663567900657654, "mean_norm/layer10": 10.012172758579254, "mean_norm/layer11": 10.251695156097412, "mean_norm/layer12": 10.633814513683319, "mean_norm/layer13": 9.980302691459656, "mean_norm/layer14": 10.304986953735352, "mean_norm/layer15": 10.544901430606842, "mean_norm/layer16": 10.066105425357819, "mean_norm/layer17": 10.478527903556824, "mean_norm/layer18": 10.129638016223907, "mean_norm/layer19": 10.159819066524506, "mean_norm/layer2": 8.67033064365387, "mean_norm/layer20": 10.265411257743835, "mean_norm/layer21": 10.219161748886108, "mean_norm/layer22": 10.989376246929169, "mean_norm/layer23": 10.939277946949005, "mean_norm/layer3": 10.444223880767822, "mean_norm/layer4": 9.575941681861877, "mean_norm/layer5": 11.377063035964966, "mean_norm/layer6": 9.207095921039581, "mean_norm/layer7": 9.61001867055893, "mean_norm/layer8": 9.98603469133377, "mean_norm/layer9": 9.933442175388336, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 6850 }, { "epoch": 2.86, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46436524257431766, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7178053855895996, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 12.0365, "eval_samples_per_second": 20.022, "eval_steps_per_second": 0.665, "step": 6850 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.88, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6681, "max_norm": 27.13735580444336, "max_norm/layer0": 21.155269622802734, "max_norm/layer1": 22.60647964477539, "max_norm/layer10": 23.85950469970703, "max_norm/layer11": 22.502986907958984, "max_norm/layer12": 24.27869415283203, "max_norm/layer13": 20.957544326782227, "max_norm/layer14": 22.631610870361328, "max_norm/layer15": 26.41908836364746, "max_norm/layer16": 22.488388061523438, "max_norm/layer17": 26.20008659362793, "max_norm/layer18": 23.15396499633789, "max_norm/layer19": 22.744834899902344, "max_norm/layer2": 18.32578468322754, "max_norm/layer20": 24.02092933654785, "max_norm/layer21": 23.352216720581055, "max_norm/layer22": 24.124401092529297, "max_norm/layer23": 23.385162353515625, "max_norm/layer3": 21.84356117248535, "max_norm/layer4": 21.661521911621094, "max_norm/layer5": 27.13735580444336, "max_norm/layer6": 19.194093704223633, "max_norm/layer7": 23.325639724731445, "max_norm/layer8": 23.56928253173828, "max_norm/layer9": 22.95269203186035, "mean_norm": 10.139540493488312, "mean_norm/layer0": 9.665144145488739, "mean_norm/layer1": 9.672926366329193, "mean_norm/layer10": 10.022092461585999, "mean_norm/layer11": 10.262580275535583, "mean_norm/layer12": 10.647343635559082, "mean_norm/layer13": 9.990399658679962, "mean_norm/layer14": 10.316211938858032, "mean_norm/layer15": 10.557567954063416, "mean_norm/layer16": 10.07616525888443, "mean_norm/layer17": 10.490152776241302, "mean_norm/layer18": 10.139376282691956, "mean_norm/layer19": 10.169822752475739, "mean_norm/layer2": 8.673572421073914, "mean_norm/layer20": 10.275636315345764, "mean_norm/layer21": 10.229391396045685, "mean_norm/layer22": 11.003340423107147, "mean_norm/layer23": 10.952987730503082, "mean_norm/layer3": 10.456810116767883, "mean_norm/layer4": 9.58361804485321, "mean_norm/layer5": 11.394310891628265, "mean_norm/layer6": 9.212887942790985, "mean_norm/layer7": 9.617939710617065, "mean_norm/layer8": 9.995769262313843, "mean_norm/layer9": 9.942924082279205, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 6900 }, { "epoch": 2.88, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46391096076546484, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7232961654663086, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.9728, "eval_samples_per_second": 20.129, "eval_steps_per_second": 0.668, "step": 6900 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.9, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.683, "max_norm": 27.246826171875, "max_norm/layer0": 21.23979949951172, "max_norm/layer1": 22.690458297729492, "max_norm/layer10": 23.941022872924805, "max_norm/layer11": 22.600021362304688, "max_norm/layer12": 24.37978744506836, "max_norm/layer13": 21.041887283325195, "max_norm/layer14": 22.723411560058594, "max_norm/layer15": 26.524131774902344, "max_norm/layer16": 22.572383880615234, "max_norm/layer17": 26.303722381591797, "max_norm/layer18": 23.273639678955078, "max_norm/layer19": 22.84536361694336, "max_norm/layer2": 18.371814727783203, "max_norm/layer20": 24.109756469726562, "max_norm/layer21": 23.438453674316406, "max_norm/layer22": 24.226545333862305, "max_norm/layer23": 23.486717224121094, "max_norm/layer3": 21.92794418334961, "max_norm/layer4": 21.739208221435547, "max_norm/layer5": 27.246826171875, "max_norm/layer6": 19.241615295410156, "max_norm/layer7": 23.398082733154297, "max_norm/layer8": 23.666467666625977, "max_norm/layer9": 23.0317325592041, "mean_norm": 10.149980219701925, "mean_norm/layer0": 9.675594747066498, "mean_norm/layer1": 9.682190597057343, "mean_norm/layer10": 10.031827569007874, "mean_norm/layer11": 10.273438334465027, "mean_norm/layer12": 10.660808444023132, "mean_norm/layer13": 10.000330448150635, "mean_norm/layer14": 10.327272832393646, "mean_norm/layer15": 10.57010704278946, "mean_norm/layer16": 10.08619076013565, "mean_norm/layer17": 10.501644492149353, "mean_norm/layer18": 10.1490837931633, "mean_norm/layer19": 10.179917216300964, "mean_norm/layer2": 8.676787793636322, "mean_norm/layer20": 10.285813570022583, "mean_norm/layer21": 10.239711225032806, "mean_norm/layer22": 11.01748389005661, "mean_norm/layer23": 10.966828763484955, "mean_norm/layer3": 10.469435572624207, "mean_norm/layer4": 9.591278553009033, "mean_norm/layer5": 11.41142475605011, "mean_norm/layer6": 9.218688607215881, "mean_norm/layer7": 9.625806748867035, "mean_norm/layer8": 10.005479514598846, "mean_norm/layer9": 9.952380001544952, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 6950 }, { "epoch": 2.9, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46421111124631403, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7184746265411377, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.9605, "eval_samples_per_second": 20.15, "eval_steps_per_second": 0.669, "step": 6950 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.92, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6739, "max_norm": 27.365013122558594, "max_norm/layer0": 21.320209503173828, "max_norm/layer1": 22.772533416748047, "max_norm/layer10": 24.037193298339844, "max_norm/layer11": 22.68212890625, "max_norm/layer12": 24.47044563293457, "max_norm/layer13": 21.140518188476562, "max_norm/layer14": 22.791292190551758, "max_norm/layer15": 26.62784194946289, "max_norm/layer16": 22.64996910095215, "max_norm/layer17": 26.407562255859375, "max_norm/layer18": 23.370203018188477, "max_norm/layer19": 22.947025299072266, "max_norm/layer2": 18.42116355895996, "max_norm/layer20": 24.20484733581543, "max_norm/layer21": 23.53941535949707, "max_norm/layer22": 24.325706481933594, "max_norm/layer23": 23.589479446411133, "max_norm/layer3": 21.999433517456055, "max_norm/layer4": 21.819570541381836, "max_norm/layer5": 27.365013122558594, "max_norm/layer6": 19.291427612304688, "max_norm/layer7": 23.481708526611328, "max_norm/layer8": 23.764585494995117, "max_norm/layer9": 23.106569290161133, "mean_norm": 10.160274868210157, "mean_norm/layer0": 9.685955584049225, "mean_norm/layer1": 9.691339433193207, "mean_norm/layer10": 10.041491627693176, "mean_norm/layer11": 10.284164071083069, "mean_norm/layer12": 10.674180507659912, "mean_norm/layer13": 10.010160326957703, "mean_norm/layer14": 10.338261485099792, "mean_norm/layer15": 10.582512021064758, "mean_norm/layer16": 10.096154391765594, "mean_norm/layer17": 10.513055503368378, "mean_norm/layer18": 10.158551752567291, "mean_norm/layer19": 10.189700782299042, "mean_norm/layer2": 8.67995148897171, "mean_norm/layer20": 10.295816540718079, "mean_norm/layer21": 10.249844431877136, "mean_norm/layer22": 11.031257331371307, "mean_norm/layer23": 10.980518758296967, "mean_norm/layer3": 10.481708467006683, "mean_norm/layer4": 9.598879992961884, "mean_norm/layer5": 11.428387343883514, "mean_norm/layer6": 9.224398612976074, "mean_norm/layer7": 9.633533835411072, "mean_norm/layer8": 10.015078723430634, "mean_norm/layer9": 9.961693823337555, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 7000 }, { "epoch": 2.92, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4648519730838028, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.71905255317688, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 12.0164, "eval_samples_per_second": 20.056, "eval_steps_per_second": 0.666, "step": 7000 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.94, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6601, "max_norm": 27.486360549926758, "max_norm/layer0": 21.405040740966797, "max_norm/layer1": 22.844478607177734, "max_norm/layer10": 24.13811683654785, "max_norm/layer11": 22.76434326171875, "max_norm/layer12": 24.57598304748535, "max_norm/layer13": 21.21640396118164, "max_norm/layer14": 22.89393424987793, "max_norm/layer15": 26.729122161865234, "max_norm/layer16": 22.737476348876953, "max_norm/layer17": 26.515493392944336, "max_norm/layer18": 23.493305206298828, "max_norm/layer19": 23.048307418823242, "max_norm/layer2": 18.475828170776367, "max_norm/layer20": 24.307435989379883, "max_norm/layer21": 23.62061882019043, "max_norm/layer22": 24.448505401611328, "max_norm/layer23": 23.68608856201172, "max_norm/layer3": 22.074338912963867, "max_norm/layer4": 21.888811111450195, "max_norm/layer5": 27.486360549926758, "max_norm/layer6": 19.338953018188477, "max_norm/layer7": 23.5861759185791, "max_norm/layer8": 23.85187530517578, "max_norm/layer9": 23.19942855834961, "mean_norm": 10.170738401512304, "mean_norm/layer0": 9.69635421037674, "mean_norm/layer1": 9.700594305992126, "mean_norm/layer10": 10.051340162754059, "mean_norm/layer11": 10.295095443725586, "mean_norm/layer12": 10.687723755836487, "mean_norm/layer13": 10.02021598815918, "mean_norm/layer14": 10.349409282207489, "mean_norm/layer15": 10.595264911651611, "mean_norm/layer16": 10.106310904026031, "mean_norm/layer17": 10.52473098039627, "mean_norm/layer18": 10.168320178985596, "mean_norm/layer19": 10.199616312980652, "mean_norm/layer2": 8.683153092861176, "mean_norm/layer20": 10.306044220924377, "mean_norm/layer21": 10.260170817375183, "mean_norm/layer22": 11.045268595218658, "mean_norm/layer23": 10.994395852088928, "mean_norm/layer3": 10.494205713272095, "mean_norm/layer4": 9.606450021266937, "mean_norm/layer5": 11.445621371269226, "mean_norm/layer6": 9.230290651321411, "mean_norm/layer7": 9.641353845596313, "mean_norm/layer8": 10.02471512556076, "mean_norm/layer9": 9.971075892448425, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 7050 }, { "epoch": 2.94, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46439769127495, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7168571949005127, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8316, "eval_samples_per_second": 20.369, "eval_steps_per_second": 0.676, "step": 7050 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.96, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.675, "max_norm": 27.602540969848633, "max_norm/layer0": 21.484041213989258, "max_norm/layer1": 22.924697875976562, "max_norm/layer10": 24.247194290161133, "max_norm/layer11": 22.84771156311035, "max_norm/layer12": 24.685514450073242, "max_norm/layer13": 21.300878524780273, "max_norm/layer14": 22.97532844543457, "max_norm/layer15": 26.83058738708496, "max_norm/layer16": 22.808544158935547, "max_norm/layer17": 26.614301681518555, "max_norm/layer18": 23.6390323638916, "max_norm/layer19": 23.148977279663086, "max_norm/layer2": 18.52928352355957, "max_norm/layer20": 24.404052734375, "max_norm/layer21": 23.719820022583008, "max_norm/layer22": 24.551822662353516, "max_norm/layer23": 23.78716468811035, "max_norm/layer3": 22.14638900756836, "max_norm/layer4": 21.958269119262695, "max_norm/layer5": 27.602540969848633, "max_norm/layer6": 19.384769439697266, "max_norm/layer7": 23.659626007080078, "max_norm/layer8": 23.928421020507812, "max_norm/layer9": 23.31978416442871, "mean_norm": 10.181060957411924, "mean_norm/layer0": 9.706688940525055, "mean_norm/layer1": 9.709847152233124, "mean_norm/layer10": 10.061019718647003, "mean_norm/layer11": 10.305987536907196, "mean_norm/layer12": 10.701012432575226, "mean_norm/layer13": 10.030164241790771, "mean_norm/layer14": 10.360415279865265, "mean_norm/layer15": 10.607886254787445, "mean_norm/layer16": 10.116294264793396, "mean_norm/layer17": 10.536153733730316, "mean_norm/layer18": 10.177928388118744, "mean_norm/layer19": 10.209418177604675, "mean_norm/layer2": 8.686349153518677, "mean_norm/layer20": 10.316045820713043, "mean_norm/layer21": 10.270420730113983, "mean_norm/layer22": 11.059071898460388, "mean_norm/layer23": 11.008045971393585, "mean_norm/layer3": 10.50650441646576, "mean_norm/layer4": 9.613870918750763, "mean_norm/layer5": 11.462700128555298, "mean_norm/layer6": 9.236022472381592, "mean_norm/layer7": 9.649041473865509, "mean_norm/layer8": 10.034249007701874, "mean_norm/layer9": 9.980324864387512, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 7100 }, { "epoch": 2.96, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.465622629723821, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.714928388595581, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8305, "eval_samples_per_second": 20.371, "eval_steps_per_second": 0.676, "step": 7100 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 2.99, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6726, "max_norm": 27.709001541137695, "max_norm/layer0": 21.556224822998047, "max_norm/layer1": 23.0113525390625, "max_norm/layer10": 24.326719284057617, "max_norm/layer11": 22.943187713623047, "max_norm/layer12": 24.772979736328125, "max_norm/layer13": 21.37757110595703, "max_norm/layer14": 23.051734924316406, "max_norm/layer15": 26.927146911621094, "max_norm/layer16": 22.884979248046875, "max_norm/layer17": 26.728662490844727, "max_norm/layer18": 23.741443634033203, "max_norm/layer19": 23.258390426635742, "max_norm/layer2": 18.579376220703125, "max_norm/layer20": 24.51500701904297, "max_norm/layer21": 23.80166244506836, "max_norm/layer22": 24.64849281311035, "max_norm/layer23": 23.88472557067871, "max_norm/layer3": 22.230770111083984, "max_norm/layer4": 22.012615203857422, "max_norm/layer5": 27.709001541137695, "max_norm/layer6": 19.437652587890625, "max_norm/layer7": 23.738452911376953, "max_norm/layer8": 23.992197036743164, "max_norm/layer9": 23.42462158203125, "mean_norm": 10.191307773192724, "mean_norm/layer0": 9.716896176338196, "mean_norm/layer1": 9.718885600566864, "mean_norm/layer10": 10.07063364982605, "mean_norm/layer11": 10.316668629646301, "mean_norm/layer12": 10.714253962039948, "mean_norm/layer13": 10.039902150630951, "mean_norm/layer14": 10.371422827243805, "mean_norm/layer15": 10.620187282562256, "mean_norm/layer16": 10.126117765903473, "mean_norm/layer17": 10.547522008419037, "mean_norm/layer18": 10.187499582767487, "mean_norm/layer19": 10.219323873519897, "mean_norm/layer2": 8.689531564712524, "mean_norm/layer20": 10.326024532318115, "mean_norm/layer21": 10.280332446098328, "mean_norm/layer22": 11.072968006134033, "mean_norm/layer23": 11.021589159965515, "mean_norm/layer3": 10.518806040287018, "mean_norm/layer4": 9.621297419071198, "mean_norm/layer5": 11.47957170009613, "mean_norm/layer6": 9.241807997226715, "mean_norm/layer7": 9.656856834888458, "mean_norm/layer8": 10.043777287006378, "mean_norm/layer9": 9.98951005935669, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 7150 }, { "epoch": 2.99, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46464105652969256, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7129509449005127, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 10.9382, "eval_samples_per_second": 22.033, "eval_steps_per_second": 0.731, "step": 7150 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.01, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.6093, "max_norm": 27.824810028076172, "max_norm/layer0": 21.625444412231445, "max_norm/layer1": 23.094030380249023, "max_norm/layer10": 24.410734176635742, "max_norm/layer11": 23.041915893554688, "max_norm/layer12": 24.885108947753906, "max_norm/layer13": 21.451623916625977, "max_norm/layer14": 23.14749526977539, "max_norm/layer15": 27.040794372558594, "max_norm/layer16": 22.965412139892578, "max_norm/layer17": 26.842836380004883, "max_norm/layer18": 23.85369300842285, "max_norm/layer19": 23.35756492614746, "max_norm/layer2": 18.625410079956055, "max_norm/layer20": 24.62005043029785, "max_norm/layer21": 23.91094207763672, "max_norm/layer22": 24.742820739746094, "max_norm/layer23": 23.971527099609375, "max_norm/layer3": 22.325895309448242, "max_norm/layer4": 22.078996658325195, "max_norm/layer5": 27.824810028076172, "max_norm/layer6": 19.494665145874023, "max_norm/layer7": 23.832578659057617, "max_norm/layer8": 24.08106803894043, "max_norm/layer9": 23.532432556152344, "mean_norm": 10.201683916151524, "mean_norm/layer0": 9.727182745933533, "mean_norm/layer1": 9.728063941001892, "mean_norm/layer10": 10.080385386943817, "mean_norm/layer11": 10.327516376972198, "mean_norm/layer12": 10.727601408958435, "mean_norm/layer13": 10.049872696399689, "mean_norm/layer14": 10.382597625255585, "mean_norm/layer15": 10.632773756980896, "mean_norm/layer16": 10.136172950267792, "mean_norm/layer17": 10.559046685695648, "mean_norm/layer18": 10.19717562198639, "mean_norm/layer19": 10.229287981987, "mean_norm/layer2": 8.692719519138336, "mean_norm/layer20": 10.336449027061462, "mean_norm/layer21": 10.290430724620819, "mean_norm/layer22": 11.086778223514557, "mean_norm/layer23": 11.035368502140045, "mean_norm/layer3": 10.53110146522522, "mean_norm/layer4": 9.628753662109375, "mean_norm/layer5": 11.49661272764206, "mean_norm/layer6": 9.247560143470764, "mean_norm/layer7": 9.664614796638489, "mean_norm/layer8": 10.053438544273376, "mean_norm/layer9": 9.99890947341919, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 7200 }, { "epoch": 3.01, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46351346418271866, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7328038215637207, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.9734, "eval_samples_per_second": 20.128, "eval_steps_per_second": 0.668, "step": 7200 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.03, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4824, "max_norm": 27.938352584838867, "max_norm/layer0": 21.70029640197754, "max_norm/layer1": 23.16924476623535, "max_norm/layer10": 24.499082565307617, "max_norm/layer11": 23.14937400817871, "max_norm/layer12": 24.984052658081055, "max_norm/layer13": 21.552579879760742, "max_norm/layer14": 23.241153717041016, "max_norm/layer15": 27.157886505126953, "max_norm/layer16": 23.04047393798828, "max_norm/layer17": 26.968616485595703, "max_norm/layer18": 23.939163208007812, "max_norm/layer19": 23.467212677001953, "max_norm/layer2": 18.67315673828125, "max_norm/layer20": 24.7244873046875, "max_norm/layer21": 24.00645637512207, "max_norm/layer22": 24.86109161376953, "max_norm/layer23": 24.05797004699707, "max_norm/layer3": 22.41858673095703, "max_norm/layer4": 22.14661979675293, "max_norm/layer5": 27.938352584838867, "max_norm/layer6": 19.537410736083984, "max_norm/layer7": 23.92576026916504, "max_norm/layer8": 24.154558181762695, "max_norm/layer9": 23.64275550842285, "mean_norm": 10.212615164617697, "mean_norm/layer0": 9.738060355186462, "mean_norm/layer1": 9.737515270709991, "mean_norm/layer10": 10.090328097343445, "mean_norm/layer11": 10.338834047317505, "mean_norm/layer12": 10.741642594337463, "mean_norm/layer13": 10.060389280319214, "mean_norm/layer14": 10.394351184368134, "mean_norm/layer15": 10.646148383617401, "mean_norm/layer16": 10.14692997932434, "mean_norm/layer17": 10.571349322795868, "mean_norm/layer18": 10.207534611225128, "mean_norm/layer19": 10.240472435951233, "mean_norm/layer2": 8.696077167987823, "mean_norm/layer20": 10.347783148288727, "mean_norm/layer21": 10.30154174566269, "mean_norm/layer22": 11.101174712181091, "mean_norm/layer23": 11.049887597560883, "mean_norm/layer3": 10.543985962867737, "mean_norm/layer4": 9.636641085147858, "mean_norm/layer5": 11.513911306858063, "mean_norm/layer6": 9.253595232963562, "mean_norm/layer7": 9.67268419265747, "mean_norm/layer8": 10.063383936882019, "mean_norm/layer9": 10.00854229927063, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 7250 }, { "epoch": 3.03, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46372032464924984, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.735767364501953, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8416, "eval_samples_per_second": 20.352, "eval_steps_per_second": 0.676, "step": 7250 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.05, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4742, "max_norm": 28.060808181762695, "max_norm/layer0": 21.76616668701172, "max_norm/layer1": 23.24862289428711, "max_norm/layer10": 24.570327758789062, "max_norm/layer11": 23.24647331237793, "max_norm/layer12": 25.09784698486328, "max_norm/layer13": 21.668365478515625, "max_norm/layer14": 23.325544357299805, "max_norm/layer15": 27.291521072387695, "max_norm/layer16": 23.135894775390625, "max_norm/layer17": 27.086589813232422, "max_norm/layer18": 24.027212142944336, "max_norm/layer19": 23.55608558654785, "max_norm/layer2": 18.72525978088379, "max_norm/layer20": 24.830610275268555, "max_norm/layer21": 24.100738525390625, "max_norm/layer22": 24.97201156616211, "max_norm/layer23": 24.144886016845703, "max_norm/layer3": 22.505525588989258, "max_norm/layer4": 22.22715950012207, "max_norm/layer5": 28.060808181762695, "max_norm/layer6": 19.58978843688965, "max_norm/layer7": 24.01059913635254, "max_norm/layer8": 24.2260799407959, "max_norm/layer9": 23.773536682128906, "mean_norm": 10.223552122712135, "mean_norm/layer0": 9.749425172805786, "mean_norm/layer1": 9.747048020362854, "mean_norm/layer10": 10.100198149681091, "mean_norm/layer11": 10.350200355052948, "mean_norm/layer12": 10.755703628063202, "mean_norm/layer13": 10.07078105211258, "mean_norm/layer14": 10.406133830547333, "mean_norm/layer15": 10.659375131130219, "mean_norm/layer16": 10.157630205154419, "mean_norm/layer17": 10.583497643470764, "mean_norm/layer18": 10.21798974275589, "mean_norm/layer19": 10.251213431358337, "mean_norm/layer2": 8.699485063552856, "mean_norm/layer20": 10.359046816825867, "mean_norm/layer21": 10.312615513801575, "mean_norm/layer22": 11.115482449531555, "mean_norm/layer23": 11.064455330371857, "mean_norm/layer3": 10.557074010372162, "mean_norm/layer4": 9.644611239433289, "mean_norm/layer5": 11.531232297420502, "mean_norm/layer6": 9.25971406698227, "mean_norm/layer7": 9.680716574192047, "mean_norm/layer8": 10.073291182518005, "mean_norm/layer9": 10.018330037593842, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 7300 }, { "epoch": 3.05, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4618301878374158, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7427256107330322, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8228, "eval_samples_per_second": 20.384, "eval_steps_per_second": 0.677, "step": 7300 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.07, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4903, "max_norm": 28.1783390045166, "max_norm/layer0": 21.83902931213379, "max_norm/layer1": 23.328245162963867, "max_norm/layer10": 24.659210205078125, "max_norm/layer11": 23.3525333404541, "max_norm/layer12": 25.218076705932617, "max_norm/layer13": 21.76858139038086, "max_norm/layer14": 23.42473793029785, "max_norm/layer15": 27.404930114746094, "max_norm/layer16": 23.211116790771484, "max_norm/layer17": 27.211097717285156, "max_norm/layer18": 24.133827209472656, "max_norm/layer19": 23.656211853027344, "max_norm/layer2": 18.778493881225586, "max_norm/layer20": 24.922006607055664, "max_norm/layer21": 24.207969665527344, "max_norm/layer22": 25.06915283203125, "max_norm/layer23": 24.239763259887695, "max_norm/layer3": 22.60003089904785, "max_norm/layer4": 22.29958152770996, "max_norm/layer5": 28.1783390045166, "max_norm/layer6": 19.645545959472656, "max_norm/layer7": 24.08893585205078, "max_norm/layer8": 24.30266761779785, "max_norm/layer9": 23.877931594848633, "mean_norm": 10.234688145418962, "mean_norm/layer0": 9.761431992053986, "mean_norm/layer1": 9.756781339645386, "mean_norm/layer10": 10.110297739505768, "mean_norm/layer11": 10.361783504486084, "mean_norm/layer12": 10.770005881786346, "mean_norm/layer13": 10.08151239156723, "mean_norm/layer14": 10.418040454387665, "mean_norm/layer15": 10.672817826271057, "mean_norm/layer16": 10.168405294418335, "mean_norm/layer17": 10.595774412155151, "mean_norm/layer18": 10.22852224111557, "mean_norm/layer19": 10.262270987033844, "mean_norm/layer2": 8.702980160713196, "mean_norm/layer20": 10.370457172393799, "mean_norm/layer21": 10.323876857757568, "mean_norm/layer22": 11.13010424375534, "mean_norm/layer23": 11.079138576984406, "mean_norm/layer3": 10.570332705974579, "mean_norm/layer4": 9.652642965316772, "mean_norm/layer5": 11.548939108848572, "mean_norm/layer6": 9.265985012054443, "mean_norm/layer7": 9.688855290412903, "mean_norm/layer8": 10.083318591117859, "mean_norm/layer9": 10.028240740299225, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 7350 }, { "epoch": 3.07, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4628604340824927, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.739495277404785, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 10.9483, "eval_samples_per_second": 22.013, "eval_steps_per_second": 0.731, "step": 7350 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.09, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5219, "max_norm": 28.30512046813965, "max_norm/layer0": 21.925140380859375, "max_norm/layer1": 23.402666091918945, "max_norm/layer10": 24.75094223022461, "max_norm/layer11": 23.466140747070312, "max_norm/layer12": 25.3124942779541, "max_norm/layer13": 21.85954475402832, "max_norm/layer14": 23.502534866333008, "max_norm/layer15": 27.527902603149414, "max_norm/layer16": 23.29158592224121, "max_norm/layer17": 27.323348999023438, "max_norm/layer18": 24.239091873168945, "max_norm/layer19": 23.75176239013672, "max_norm/layer2": 18.829025268554688, "max_norm/layer20": 25.023799896240234, "max_norm/layer21": 24.31355094909668, "max_norm/layer22": 25.157793045043945, "max_norm/layer23": 24.331005096435547, "max_norm/layer3": 22.704940795898438, "max_norm/layer4": 22.374662399291992, "max_norm/layer5": 28.30512046813965, "max_norm/layer6": 19.703712463378906, "max_norm/layer7": 24.16960906982422, "max_norm/layer8": 24.37641143798828, "max_norm/layer9": 23.971576690673828, "mean_norm": 10.245796350141367, "mean_norm/layer0": 9.773649513721466, "mean_norm/layer1": 9.76639074087143, "mean_norm/layer10": 10.12041312456131, "mean_norm/layer11": 10.373321115970612, "mean_norm/layer12": 10.784271001815796, "mean_norm/layer13": 10.09208732843399, "mean_norm/layer14": 10.429891586303711, "mean_norm/layer15": 10.686288714408875, "mean_norm/layer16": 10.17914080619812, "mean_norm/layer17": 10.608086168766022, "mean_norm/layer18": 10.238989114761353, "mean_norm/layer19": 10.273307204246521, "mean_norm/layer2": 8.706504940986633, "mean_norm/layer20": 10.381437599658966, "mean_norm/layer21": 10.334827601909637, "mean_norm/layer22": 11.144693374633789, "mean_norm/layer23": 11.09385484457016, "mean_norm/layer3": 10.583644211292267, "mean_norm/layer4": 9.66067487001419, "mean_norm/layer5": 11.566678524017334, "mean_norm/layer6": 9.272311866283417, "mean_norm/layer7": 9.697041988372803, "mean_norm/layer8": 10.093447387218475, "mean_norm/layer9": 10.038158774375916, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 7400 }, { "epoch": 3.09, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4631037993372353, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7434771060943604, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.9589, "eval_samples_per_second": 20.152, "eval_steps_per_second": 0.669, "step": 7400 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.11, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5297, "max_norm": 28.41901206970215, "max_norm/layer0": 21.99617576599121, "max_norm/layer1": 23.478212356567383, "max_norm/layer10": 24.831113815307617, "max_norm/layer11": 23.557214736938477, "max_norm/layer12": 25.407339096069336, "max_norm/layer13": 21.933692932128906, "max_norm/layer14": 23.58243179321289, "max_norm/layer15": 27.664417266845703, "max_norm/layer16": 23.40688133239746, "max_norm/layer17": 27.449398040771484, "max_norm/layer18": 24.320056915283203, "max_norm/layer19": 23.8420467376709, "max_norm/layer2": 18.881885528564453, "max_norm/layer20": 25.124309539794922, "max_norm/layer21": 24.40587043762207, "max_norm/layer22": 25.251537322998047, "max_norm/layer23": 24.414310455322266, "max_norm/layer3": 22.804298400878906, "max_norm/layer4": 22.448192596435547, "max_norm/layer5": 28.41901206970215, "max_norm/layer6": 19.762104034423828, "max_norm/layer7": 24.261402130126953, "max_norm/layer8": 24.460205078125, "max_norm/layer9": 24.068944931030273, "mean_norm": 10.256785544256369, "mean_norm/layer0": 9.786031067371368, "mean_norm/layer1": 9.776026725769043, "mean_norm/layer10": 10.13040566444397, "mean_norm/layer11": 10.384915590286255, "mean_norm/layer12": 10.798379123210907, "mean_norm/layer13": 10.102573335170746, "mean_norm/layer14": 10.441614508628845, "mean_norm/layer15": 10.699365377426147, "mean_norm/layer16": 10.189636588096619, "mean_norm/layer17": 10.620143711566925, "mean_norm/layer18": 10.249273598194122, "mean_norm/layer19": 10.28394889831543, "mean_norm/layer2": 8.710040807723999, "mean_norm/layer20": 10.392243266105652, "mean_norm/layer21": 10.345543622970581, "mean_norm/layer22": 11.159203112125397, "mean_norm/layer23": 11.108225405216217, "mean_norm/layer3": 10.59694367647171, "mean_norm/layer4": 9.66866660118103, "mean_norm/layer5": 11.584315299987793, "mean_norm/layer6": 9.278502762317657, "mean_norm/layer7": 9.705314993858337, "mean_norm/layer8": 10.10358864068985, "mean_norm/layer9": 10.047950685024261, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 7450 }, { "epoch": 3.11, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46243454488669317, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.741889238357544, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 12.0032, "eval_samples_per_second": 20.078, "eval_steps_per_second": 0.666, "step": 7450 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.13, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5378, "max_norm": 28.534168243408203, "max_norm/layer0": 22.058876037597656, "max_norm/layer1": 23.55440330505371, "max_norm/layer10": 24.924272537231445, "max_norm/layer11": 23.644363403320312, "max_norm/layer12": 25.500591278076172, "max_norm/layer13": 22.042232513427734, "max_norm/layer14": 23.674577713012695, "max_norm/layer15": 27.777328491210938, "max_norm/layer16": 23.501466751098633, "max_norm/layer17": 27.558422088623047, "max_norm/layer18": 24.424163818359375, "max_norm/layer19": 23.938682556152344, "max_norm/layer2": 18.931631088256836, "max_norm/layer20": 25.224212646484375, "max_norm/layer21": 24.5081729888916, "max_norm/layer22": 25.363332748413086, "max_norm/layer23": 24.50674819946289, "max_norm/layer3": 22.900821685791016, "max_norm/layer4": 22.509111404418945, "max_norm/layer5": 28.534168243408203, "max_norm/layer6": 19.816333770751953, "max_norm/layer7": 24.353036880493164, "max_norm/layer8": 24.543941497802734, "max_norm/layer9": 24.16282081604004, "mean_norm": 10.267906568944454, "mean_norm/layer0": 9.798717558383942, "mean_norm/layer1": 9.785801529884338, "mean_norm/layer10": 10.14056795835495, "mean_norm/layer11": 10.396467983722687, "mean_norm/layer12": 10.812629520893097, "mean_norm/layer13": 10.113163471221924, "mean_norm/layer14": 10.453515112400055, "mean_norm/layer15": 10.712714493274689, "mean_norm/layer16": 10.200285851955414, "mean_norm/layer17": 10.632267236709595, "mean_norm/layer18": 10.259525001049042, "mean_norm/layer19": 10.294664680957794, "mean_norm/layer2": 8.713631331920624, "mean_norm/layer20": 10.403029263019562, "mean_norm/layer21": 10.356555461883545, "mean_norm/layer22": 11.173887729644775, "mean_norm/layer23": 11.122698366641998, "mean_norm/layer3": 10.61043643951416, "mean_norm/layer4": 9.676729619503021, "mean_norm/layer5": 11.602260768413544, "mean_norm/layer6": 9.284881472587585, "mean_norm/layer7": 9.7137091755867, "mean_norm/layer8": 10.113835334777832, "mean_norm/layer9": 10.057782292366028, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 7500 }, { "epoch": 3.13, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4612461112260336, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7466063499450684, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8975, "eval_samples_per_second": 20.256, "eval_steps_per_second": 0.672, "step": 7500 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.15, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5262, "max_norm": 28.647478103637695, "max_norm/layer0": 22.12501335144043, "max_norm/layer1": 23.629316329956055, "max_norm/layer10": 25.00779151916504, "max_norm/layer11": 23.737573623657227, "max_norm/layer12": 25.5867919921875, "max_norm/layer13": 22.13935661315918, "max_norm/layer14": 23.769336700439453, "max_norm/layer15": 27.88351821899414, "max_norm/layer16": 23.595199584960938, "max_norm/layer17": 27.670772552490234, "max_norm/layer18": 24.5206241607666, "max_norm/layer19": 24.02391815185547, "max_norm/layer2": 18.966272354125977, "max_norm/layer20": 25.31734848022461, "max_norm/layer21": 24.615201950073242, "max_norm/layer22": 25.462045669555664, "max_norm/layer23": 24.59248924255371, "max_norm/layer3": 22.99334716796875, "max_norm/layer4": 22.572772979736328, "max_norm/layer5": 28.647478103637695, "max_norm/layer6": 19.873327255249023, "max_norm/layer7": 24.456520080566406, "max_norm/layer8": 24.614551544189453, "max_norm/layer9": 24.24704933166504, "mean_norm": 10.278987641135851, "mean_norm/layer0": 9.811449825763702, "mean_norm/layer1": 9.795596778392792, "mean_norm/layer10": 10.150748670101166, "mean_norm/layer11": 10.407971441745758, "mean_norm/layer12": 10.826962232589722, "mean_norm/layer13": 10.123676836490631, "mean_norm/layer14": 10.465408980846405, "mean_norm/layer15": 10.726069808006287, "mean_norm/layer16": 10.210875153541565, "mean_norm/layer17": 10.644302904605865, "mean_norm/layer18": 10.269866168498993, "mean_norm/layer19": 10.305279195308685, "mean_norm/layer2": 8.717224657535553, "mean_norm/layer20": 10.413566410541534, "mean_norm/layer21": 10.367369532585144, "mean_norm/layer22": 11.18840491771698, "mean_norm/layer23": 11.13710218667984, "mean_norm/layer3": 10.623844742774963, "mean_norm/layer4": 9.68492478132248, "mean_norm/layer5": 11.620170950889587, "mean_norm/layer6": 9.291176974773407, "mean_norm/layer7": 9.722011387348175, "mean_norm/layer8": 10.12408995628357, "mean_norm/layer9": 10.067608892917633, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 7550 }, { "epoch": 3.15, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4627468636302795, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.742647886276245, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.9512, "eval_samples_per_second": 20.165, "eval_steps_per_second": 0.669, "step": 7550 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.17, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5466, "max_norm": 28.759456634521484, "max_norm/layer0": 22.189687728881836, "max_norm/layer1": 23.718957901000977, "max_norm/layer10": 25.11297607421875, "max_norm/layer11": 23.83050537109375, "max_norm/layer12": 25.688610076904297, "max_norm/layer13": 22.221534729003906, "max_norm/layer14": 23.87668800354004, "max_norm/layer15": 28.021175384521484, "max_norm/layer16": 23.694242477416992, "max_norm/layer17": 27.787132263183594, "max_norm/layer18": 24.62793731689453, "max_norm/layer19": 24.113933563232422, "max_norm/layer2": 19.001083374023438, "max_norm/layer20": 25.41383171081543, "max_norm/layer21": 24.711917877197266, "max_norm/layer22": 25.558143615722656, "max_norm/layer23": 24.674909591674805, "max_norm/layer3": 23.080352783203125, "max_norm/layer4": 22.64613151550293, "max_norm/layer5": 28.759456634521484, "max_norm/layer6": 19.9383487701416, "max_norm/layer7": 24.539579391479492, "max_norm/layer8": 24.692691802978516, "max_norm/layer9": 24.328855514526367, "mean_norm": 10.29014177620411, "mean_norm/layer0": 9.824274837970734, "mean_norm/layer1": 9.805485486984253, "mean_norm/layer10": 10.160942137241364, "mean_norm/layer11": 10.419573247432709, "mean_norm/layer12": 10.841314256191254, "mean_norm/layer13": 10.134314954280853, "mean_norm/layer14": 10.47724461555481, "mean_norm/layer15": 10.739534556865692, "mean_norm/layer16": 10.221598386764526, "mean_norm/layer17": 10.656368911266327, "mean_norm/layer18": 10.280156254768372, "mean_norm/layer19": 10.315918445587158, "mean_norm/layer2": 8.720892071723938, "mean_norm/layer20": 10.424446642398834, "mean_norm/layer21": 10.378287017345428, "mean_norm/layer22": 11.202922701835632, "mean_norm/layer23": 11.151463150978088, "mean_norm/layer3": 10.637423694133759, "mean_norm/layer4": 9.69320422410965, "mean_norm/layer5": 11.6382976770401, "mean_norm/layer6": 9.297437250614166, "mean_norm/layer7": 9.730381071567535, "mean_norm/layer8": 10.134437918663025, "mean_norm/layer9": 10.077483117580414, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 7600 }, { "epoch": 3.17, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4620857213548955, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7406821250915527, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.9297, "eval_samples_per_second": 20.202, "eval_steps_per_second": 0.671, "step": 7600 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.19, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5417, "max_norm": 28.87610626220703, "max_norm/layer0": 22.26255989074707, "max_norm/layer1": 23.79456329345703, "max_norm/layer10": 25.207901000976562, "max_norm/layer11": 23.90155601501465, "max_norm/layer12": 25.78806495666504, "max_norm/layer13": 22.295835494995117, "max_norm/layer14": 23.981624603271484, "max_norm/layer15": 28.134763717651367, "max_norm/layer16": 23.79250144958496, "max_norm/layer17": 27.918643951416016, "max_norm/layer18": 24.73369598388672, "max_norm/layer19": 24.21535301208496, "max_norm/layer2": 19.049760818481445, "max_norm/layer20": 25.499326705932617, "max_norm/layer21": 24.808273315429688, "max_norm/layer22": 25.657686233520508, "max_norm/layer23": 24.76559829711914, "max_norm/layer3": 23.16707420349121, "max_norm/layer4": 22.7286376953125, "max_norm/layer5": 28.87610626220703, "max_norm/layer6": 19.98716926574707, "max_norm/layer7": 24.625072479248047, "max_norm/layer8": 24.779348373413086, "max_norm/layer9": 24.42043685913086, "mean_norm": 10.301014435787996, "mean_norm/layer0": 9.836885809898376, "mean_norm/layer1": 9.81521886587143, "mean_norm/layer10": 10.170771658420563, "mean_norm/layer11": 10.430792689323425, "mean_norm/layer12": 10.855295896530151, "mean_norm/layer13": 10.144669532775879, "mean_norm/layer14": 10.488730907440186, "mean_norm/layer15": 10.75255537033081, "mean_norm/layer16": 10.232070505619049, "mean_norm/layer17": 10.668150544166565, "mean_norm/layer18": 10.290162086486816, "mean_norm/layer19": 10.326179146766663, "mean_norm/layer2": 8.724476277828217, "mean_norm/layer20": 10.43507844209671, "mean_norm/layer21": 10.388847172260284, "mean_norm/layer22": 11.217085540294647, "mean_norm/layer23": 11.16545057296753, "mean_norm/layer3": 10.650694847106934, "mean_norm/layer4": 9.701324820518494, "mean_norm/layer5": 11.656121969223022, "mean_norm/layer6": 9.303574085235596, "mean_norm/layer7": 9.738611280918121, "mean_norm/layer8": 10.144423842430115, "mean_norm/layer9": 10.087174594402313, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 7650 }, { "epoch": 3.19, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4635945859342995, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7404425144195557, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 10.9178, "eval_samples_per_second": 22.074, "eval_steps_per_second": 0.733, "step": 7650 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.22, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5543, "max_norm": 28.989912033081055, "max_norm/layer0": 22.333951950073242, "max_norm/layer1": 23.86414909362793, "max_norm/layer10": 25.30396270751953, "max_norm/layer11": 23.973237991333008, "max_norm/layer12": 25.900819778442383, "max_norm/layer13": 22.36374282836914, "max_norm/layer14": 24.077177047729492, "max_norm/layer15": 28.262537002563477, "max_norm/layer16": 23.878515243530273, "max_norm/layer17": 28.032825469970703, "max_norm/layer18": 24.851049423217773, "max_norm/layer19": 24.301414489746094, "max_norm/layer2": 19.102933883666992, "max_norm/layer20": 25.588642120361328, "max_norm/layer21": 24.90848159790039, "max_norm/layer22": 25.761886596679688, "max_norm/layer23": 24.848621368408203, "max_norm/layer3": 23.259109497070312, "max_norm/layer4": 22.849287033081055, "max_norm/layer5": 28.989912033081055, "max_norm/layer6": 20.03278350830078, "max_norm/layer7": 24.701374053955078, "max_norm/layer8": 24.87116050720215, "max_norm/layer9": 24.52387237548828, "mean_norm": 10.31198395540317, "mean_norm/layer0": 9.849559903144836, "mean_norm/layer1": 9.82489401102066, "mean_norm/layer10": 10.180826425552368, "mean_norm/layer11": 10.442092299461365, "mean_norm/layer12": 10.869353592395782, "mean_norm/layer13": 10.155152142047882, "mean_norm/layer14": 10.500398457050323, "mean_norm/layer15": 10.765804052352905, "mean_norm/layer16": 10.242531597614288, "mean_norm/layer17": 10.67978948354721, "mean_norm/layer18": 10.300297379493713, "mean_norm/layer19": 10.336560845375061, "mean_norm/layer2": 8.72812283039093, "mean_norm/layer20": 10.445524156093597, "mean_norm/layer21": 10.399671375751495, "mean_norm/layer22": 11.231338143348694, "mean_norm/layer23": 11.17959988117218, "mean_norm/layer3": 10.664167523384094, "mean_norm/layer4": 9.709515035152435, "mean_norm/layer5": 11.674124658107758, "mean_norm/layer6": 9.309807479381561, "mean_norm/layer7": 9.746842324733734, "mean_norm/layer8": 10.15455275774002, "mean_norm/layer9": 10.09708857536316, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 7700 }, { "epoch": 3.22, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4629983410601802, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.741414785385132, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7003, "eval_samples_per_second": 20.598, "eval_steps_per_second": 0.684, "step": 7700 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.24, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5553, "max_norm": 29.090238571166992, "max_norm/layer0": 22.41193389892578, "max_norm/layer1": 23.93515396118164, "max_norm/layer10": 25.398143768310547, "max_norm/layer11": 24.047224044799805, "max_norm/layer12": 25.994855880737305, "max_norm/layer13": 22.43844985961914, "max_norm/layer14": 24.178451538085938, "max_norm/layer15": 28.364883422851562, "max_norm/layer16": 23.977371215820312, "max_norm/layer17": 28.133155822753906, "max_norm/layer18": 24.957571029663086, "max_norm/layer19": 24.386947631835938, "max_norm/layer2": 19.165626525878906, "max_norm/layer20": 25.671714782714844, "max_norm/layer21": 25.00211524963379, "max_norm/layer22": 25.86479949951172, "max_norm/layer23": 24.936710357666016, "max_norm/layer3": 23.344837188720703, "max_norm/layer4": 22.948711395263672, "max_norm/layer5": 29.090238571166992, "max_norm/layer6": 20.085012435913086, "max_norm/layer7": 24.796207427978516, "max_norm/layer8": 24.96137809753418, "max_norm/layer9": 24.61630630493164, "mean_norm": 10.322781873246035, "mean_norm/layer0": 9.862114548683167, "mean_norm/layer1": 9.834554076194763, "mean_norm/layer10": 10.19078516960144, "mean_norm/layer11": 10.453184068202972, "mean_norm/layer12": 10.883156538009644, "mean_norm/layer13": 10.16549926996231, "mean_norm/layer14": 10.511900305747986, "mean_norm/layer15": 10.778773725032806, "mean_norm/layer16": 10.252846658229828, "mean_norm/layer17": 10.691301107406616, "mean_norm/layer18": 10.310111284255981, "mean_norm/layer19": 10.346852660179138, "mean_norm/layer2": 8.731664061546326, "mean_norm/layer20": 10.455866873264313, "mean_norm/layer21": 10.410119354724884, "mean_norm/layer22": 11.245464563369751, "mean_norm/layer23": 11.193513989448547, "mean_norm/layer3": 10.677456438541412, "mean_norm/layer4": 9.71753478050232, "mean_norm/layer5": 11.691821098327637, "mean_norm/layer6": 9.316016852855682, "mean_norm/layer7": 9.754923164844513, "mean_norm/layer8": 10.164519965648651, "mean_norm/layer9": 10.106784403324127, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 7750 }, { "epoch": 3.24, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46314436021302574, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7383084297180176, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7215, "eval_samples_per_second": 20.56, "eval_steps_per_second": 0.683, "step": 7750 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.26, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5628, "max_norm": 29.21254539489746, "max_norm/layer0": 22.484031677246094, "max_norm/layer1": 24.008319854736328, "max_norm/layer10": 25.487390518188477, "max_norm/layer11": 24.109447479248047, "max_norm/layer12": 26.10677146911621, "max_norm/layer13": 22.515703201293945, "max_norm/layer14": 24.291309356689453, "max_norm/layer15": 28.477415084838867, "max_norm/layer16": 24.077625274658203, "max_norm/layer17": 28.249710083007812, "max_norm/layer18": 25.04519271850586, "max_norm/layer19": 24.4896183013916, "max_norm/layer2": 19.21530532836914, "max_norm/layer20": 25.777645111083984, "max_norm/layer21": 25.095863342285156, "max_norm/layer22": 25.952531814575195, "max_norm/layer23": 25.035606384277344, "max_norm/layer3": 23.437124252319336, "max_norm/layer4": 23.04496192932129, "max_norm/layer5": 29.21254539489746, "max_norm/layer6": 20.13669776916504, "max_norm/layer7": 24.908952713012695, "max_norm/layer8": 25.054763793945312, "max_norm/layer9": 24.6956787109375, "mean_norm": 10.33362782249848, "mean_norm/layer0": 9.874791443347931, "mean_norm/layer1": 9.844236731529236, "mean_norm/layer10": 10.200762331485748, "mean_norm/layer11": 10.464483559131622, "mean_norm/layer12": 10.897128105163574, "mean_norm/layer13": 10.175809919834137, "mean_norm/layer14": 10.523499190807343, "mean_norm/layer15": 10.791725218296051, "mean_norm/layer16": 10.263132691383362, "mean_norm/layer17": 10.70292180776596, "mean_norm/layer18": 10.320022165775299, "mean_norm/layer19": 10.357090592384338, "mean_norm/layer2": 8.735245108604431, "mean_norm/layer20": 10.466160774230957, "mean_norm/layer21": 10.42063820362091, "mean_norm/layer22": 11.259634852409363, "mean_norm/layer23": 11.207477986812592, "mean_norm/layer3": 10.69071638584137, "mean_norm/layer4": 9.72552090883255, "mean_norm/layer5": 11.709686279296875, "mean_norm/layer6": 9.32220333814621, "mean_norm/layer7": 9.763081669807434, "mean_norm/layer8": 10.174527645111084, "mean_norm/layer9": 10.116570830345154, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 7800 }, { "epoch": 3.26, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4632457624025018, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.736220121383667, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.9335, "eval_samples_per_second": 20.195, "eval_steps_per_second": 0.67, "step": 7800 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.28, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5544, "max_norm": 29.331188201904297, "max_norm/layer0": 22.55216407775879, "max_norm/layer1": 24.07997703552246, "max_norm/layer10": 25.5628719329834, "max_norm/layer11": 24.17657470703125, "max_norm/layer12": 26.19219970703125, "max_norm/layer13": 22.586214065551758, "max_norm/layer14": 24.382736206054688, "max_norm/layer15": 28.602956771850586, "max_norm/layer16": 24.1601619720459, "max_norm/layer17": 28.35554313659668, "max_norm/layer18": 25.14252281188965, "max_norm/layer19": 24.595355987548828, "max_norm/layer2": 19.27031135559082, "max_norm/layer20": 25.8691463470459, "max_norm/layer21": 25.18440055847168, "max_norm/layer22": 26.064830780029297, "max_norm/layer23": 25.118104934692383, "max_norm/layer3": 23.54576301574707, "max_norm/layer4": 23.14463996887207, "max_norm/layer5": 29.331188201904297, "max_norm/layer6": 20.195871353149414, "max_norm/layer7": 25.005327224731445, "max_norm/layer8": 25.13247299194336, "max_norm/layer9": 24.790437698364258, "mean_norm": 10.344553100566069, "mean_norm/layer0": 9.88759696483612, "mean_norm/layer1": 9.854110896587372, "mean_norm/layer10": 10.210679829120636, "mean_norm/layer11": 10.475803256034851, "mean_norm/layer12": 10.911135852336884, "mean_norm/layer13": 10.186229526996613, "mean_norm/layer14": 10.535084962844849, "mean_norm/layer15": 10.804824233055115, "mean_norm/layer16": 10.273425579071045, "mean_norm/layer17": 10.714586555957794, "mean_norm/layer18": 10.32996690273285, "mean_norm/layer19": 10.367372214794159, "mean_norm/layer2": 8.738913834095001, "mean_norm/layer20": 10.476485311985016, "mean_norm/layer21": 10.431126654148102, "mean_norm/layer22": 11.273919343948364, "mean_norm/layer23": 11.221592783927917, "mean_norm/layer3": 10.70423948764801, "mean_norm/layer4": 9.73361724615097, "mean_norm/layer5": 11.727725446224213, "mean_norm/layer6": 9.328507781028748, "mean_norm/layer7": 9.771354794502258, "mean_norm/layer8": 10.184631109237671, "mean_norm/layer9": 10.126343846321106, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 7850 }, { "epoch": 3.28, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46365542724798514, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.735917329788208, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.9355, "eval_samples_per_second": 20.192, "eval_steps_per_second": 0.67, "step": 7850 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.3, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5519, "max_norm": 29.44374656677246, "max_norm/layer0": 22.62066650390625, "max_norm/layer1": 24.155412673950195, "max_norm/layer10": 25.649127960205078, "max_norm/layer11": 24.254257202148438, "max_norm/layer12": 26.287227630615234, "max_norm/layer13": 22.658599853515625, "max_norm/layer14": 24.459514617919922, "max_norm/layer15": 28.717144012451172, "max_norm/layer16": 24.274436950683594, "max_norm/layer17": 28.46417808532715, "max_norm/layer18": 25.246158599853516, "max_norm/layer19": 24.703245162963867, "max_norm/layer2": 19.330106735229492, "max_norm/layer20": 25.960447311401367, "max_norm/layer21": 25.28472328186035, "max_norm/layer22": 26.16750717163086, "max_norm/layer23": 25.200824737548828, "max_norm/layer3": 23.6591854095459, "max_norm/layer4": 23.238862991333008, "max_norm/layer5": 29.44374656677246, "max_norm/layer6": 20.259044647216797, "max_norm/layer7": 25.118812561035156, "max_norm/layer8": 25.218399047851562, "max_norm/layer9": 24.899673461914062, "mean_norm": 10.355501912534237, "mean_norm/layer0": 9.900353372097015, "mean_norm/layer1": 9.86406821012497, "mean_norm/layer10": 10.220719993114471, "mean_norm/layer11": 10.48711621761322, "mean_norm/layer12": 10.925248146057129, "mean_norm/layer13": 10.196601510047913, "mean_norm/layer14": 10.546653389930725, "mean_norm/layer15": 10.817915558815002, "mean_norm/layer16": 10.283754646778107, "mean_norm/layer17": 10.726405084133148, "mean_norm/layer18": 10.339860618114471, "mean_norm/layer19": 10.377592206001282, "mean_norm/layer2": 8.742589831352234, "mean_norm/layer20": 10.486961722373962, "mean_norm/layer21": 10.441667020320892, "mean_norm/layer22": 11.288079738616943, "mean_norm/layer23": 11.235736012458801, "mean_norm/layer3": 10.717736423015594, "mean_norm/layer4": 9.74189966917038, "mean_norm/layer5": 11.745728731155396, "mean_norm/layer6": 9.33476859331131, "mean_norm/layer7": 9.779621005058289, "mean_norm/layer8": 10.194773256778717, "mean_norm/layer9": 10.136194944381714, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 7900 }, { "epoch": 3.3, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46300645323533823, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7365753650665283, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 10.9411, "eval_samples_per_second": 22.027, "eval_steps_per_second": 0.731, "step": 7900 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.32, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5604, "max_norm": 29.56292724609375, "max_norm/layer0": 22.706741333007812, "max_norm/layer1": 24.238323211669922, "max_norm/layer10": 25.757524490356445, "max_norm/layer11": 24.320594787597656, "max_norm/layer12": 26.380447387695312, "max_norm/layer13": 22.746694564819336, "max_norm/layer14": 24.556163787841797, "max_norm/layer15": 28.821693420410156, "max_norm/layer16": 24.36968994140625, "max_norm/layer17": 28.576396942138672, "max_norm/layer18": 25.369043350219727, "max_norm/layer19": 24.811838150024414, "max_norm/layer2": 19.388208389282227, "max_norm/layer20": 26.059162139892578, "max_norm/layer21": 25.400894165039062, "max_norm/layer22": 26.286211013793945, "max_norm/layer23": 25.288856506347656, "max_norm/layer3": 23.755037307739258, "max_norm/layer4": 23.329593658447266, "max_norm/layer5": 29.56292724609375, "max_norm/layer6": 20.32733154296875, "max_norm/layer7": 25.217721939086914, "max_norm/layer8": 25.305147171020508, "max_norm/layer9": 24.998611450195312, "mean_norm": 10.366318744917711, "mean_norm/layer0": 9.913071632385254, "mean_norm/layer1": 9.87394368648529, "mean_norm/layer10": 10.230653047561646, "mean_norm/layer11": 10.498328745365143, "mean_norm/layer12": 10.939123094081879, "mean_norm/layer13": 10.206881523132324, "mean_norm/layer14": 10.558052361011505, "mean_norm/layer15": 10.830873608589172, "mean_norm/layer16": 10.293963611125946, "mean_norm/layer17": 10.738054513931274, "mean_norm/layer18": 10.349761128425598, "mean_norm/layer19": 10.387810349464417, "mean_norm/layer2": 8.7461838722229, "mean_norm/layer20": 10.49695074558258, "mean_norm/layer21": 10.451958894729614, "mean_norm/layer22": 11.301961421966553, "mean_norm/layer23": 11.249614596366882, "mean_norm/layer3": 10.73119992017746, "mean_norm/layer4": 9.750132262706757, "mean_norm/layer5": 11.763619303703308, "mean_norm/layer6": 9.34090131521225, "mean_norm/layer7": 9.787860095500946, "mean_norm/layer8": 10.204774379730225, "mean_norm/layer9": 10.145975768566132, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 7950 }, { "epoch": 3.32, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4639434094660972, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7317562103271484, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7183, "eval_samples_per_second": 20.566, "eval_steps_per_second": 0.683, "step": 7950 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.34, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.574, "max_norm": 29.686235427856445, "max_norm/layer0": 22.817535400390625, "max_norm/layer1": 24.31894302368164, "max_norm/layer10": 25.852500915527344, "max_norm/layer11": 24.389923095703125, "max_norm/layer12": 26.46706199645996, "max_norm/layer13": 22.830928802490234, "max_norm/layer14": 24.660869598388672, "max_norm/layer15": 28.929563522338867, "max_norm/layer16": 24.46345329284668, "max_norm/layer17": 28.688806533813477, "max_norm/layer18": 25.51277732849121, "max_norm/layer19": 24.911882400512695, "max_norm/layer2": 19.448562622070312, "max_norm/layer20": 26.146984100341797, "max_norm/layer21": 25.494787216186523, "max_norm/layer22": 26.37640953063965, "max_norm/layer23": 25.375213623046875, "max_norm/layer3": 23.8410701751709, "max_norm/layer4": 23.417619705200195, "max_norm/layer5": 29.686235427856445, "max_norm/layer6": 20.39133071899414, "max_norm/layer7": 25.319486618041992, "max_norm/layer8": 25.389860153198242, "max_norm/layer9": 25.100292205810547, "mean_norm": 10.377166591584682, "mean_norm/layer0": 9.92577999830246, "mean_norm/layer1": 9.883734285831451, "mean_norm/layer10": 10.240622818470001, "mean_norm/layer11": 10.509494483470917, "mean_norm/layer12": 10.953135788440704, "mean_norm/layer13": 10.217233061790466, "mean_norm/layer14": 10.569559216499329, "mean_norm/layer15": 10.843758702278137, "mean_norm/layer16": 10.30425751209259, "mean_norm/layer17": 10.749723374843597, "mean_norm/layer18": 10.359737277030945, "mean_norm/layer19": 10.398090779781342, "mean_norm/layer2": 8.749907433986664, "mean_norm/layer20": 10.507069289684296, "mean_norm/layer21": 10.462173759937286, "mean_norm/layer22": 11.315882444381714, "mean_norm/layer23": 11.263618886470795, "mean_norm/layer3": 10.744675993919373, "mean_norm/layer4": 9.758215069770813, "mean_norm/layer5": 11.781563222408295, "mean_norm/layer6": 9.347027242183685, "mean_norm/layer7": 9.796038210391998, "mean_norm/layer8": 10.214890122413635, "mean_norm/layer9": 10.155809223651886, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 8000 }, { "epoch": 3.34, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46419488689599786, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7337546348571777, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 10.9253, "eval_samples_per_second": 22.059, "eval_steps_per_second": 0.732, "step": 8000 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.36, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5681, "max_norm": 29.79633331298828, "max_norm/layer0": 22.923782348632812, "max_norm/layer1": 24.38690185546875, "max_norm/layer10": 25.94072151184082, "max_norm/layer11": 24.459306716918945, "max_norm/layer12": 26.563783645629883, "max_norm/layer13": 22.916555404663086, "max_norm/layer14": 24.759183883666992, "max_norm/layer15": 29.03226089477539, "max_norm/layer16": 24.558034896850586, "max_norm/layer17": 28.802165985107422, "max_norm/layer18": 25.61612892150879, "max_norm/layer19": 25.000877380371094, "max_norm/layer2": 19.50658416748047, "max_norm/layer20": 26.22553253173828, "max_norm/layer21": 25.60858726501465, "max_norm/layer22": 26.475278854370117, "max_norm/layer23": 25.460458755493164, "max_norm/layer3": 23.920320510864258, "max_norm/layer4": 23.51832389831543, "max_norm/layer5": 29.79633331298828, "max_norm/layer6": 20.452802658081055, "max_norm/layer7": 25.421403884887695, "max_norm/layer8": 25.46021270751953, "max_norm/layer9": 25.197437286376953, "mean_norm": 10.387797482311726, "mean_norm/layer0": 9.938105344772339, "mean_norm/layer1": 9.893487989902496, "mean_norm/layer10": 10.250402808189392, "mean_norm/layer11": 10.520434379577637, "mean_norm/layer12": 10.96678900718689, "mean_norm/layer13": 10.227465033531189, "mean_norm/layer14": 10.580823600292206, "mean_norm/layer15": 10.856427371501923, "mean_norm/layer16": 10.314347922801971, "mean_norm/layer17": 10.761028468608856, "mean_norm/layer18": 10.369467556476593, "mean_norm/layer19": 10.408168733119965, "mean_norm/layer2": 8.753524899482727, "mean_norm/layer20": 10.516979813575745, "mean_norm/layer21": 10.47218245267868, "mean_norm/layer22": 11.329629778862, "mean_norm/layer23": 11.277422606945038, "mean_norm/layer3": 10.75775521993637, "mean_norm/layer4": 9.766146004199982, "mean_norm/layer5": 11.799201905727386, "mean_norm/layer6": 9.35314804315567, "mean_norm/layer7": 9.804097712039948, "mean_norm/layer8": 10.22478049993515, "mean_norm/layer9": 10.165322422981262, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 8050 }, { "epoch": 3.36, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46359864202187856, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7321524620056152, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.9139, "eval_samples_per_second": 20.228, "eval_steps_per_second": 0.671, "step": 8050 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.38, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5672, "max_norm": 29.917709350585938, "max_norm/layer0": 23.026636123657227, "max_norm/layer1": 24.44870376586914, "max_norm/layer10": 26.026018142700195, "max_norm/layer11": 24.52729034423828, "max_norm/layer12": 26.678749084472656, "max_norm/layer13": 23.003549575805664, "max_norm/layer14": 24.862823486328125, "max_norm/layer15": 29.15134048461914, "max_norm/layer16": 24.638816833496094, "max_norm/layer17": 28.92781639099121, "max_norm/layer18": 25.733177185058594, "max_norm/layer19": 25.097875595092773, "max_norm/layer2": 19.571752548217773, "max_norm/layer20": 26.306419372558594, "max_norm/layer21": 25.732044219970703, "max_norm/layer22": 26.59418296813965, "max_norm/layer23": 25.56702995300293, "max_norm/layer3": 23.995433807373047, "max_norm/layer4": 23.631168365478516, "max_norm/layer5": 29.917709350585938, "max_norm/layer6": 20.507673263549805, "max_norm/layer7": 25.506603240966797, "max_norm/layer8": 25.542097091674805, "max_norm/layer9": 25.293928146362305, "mean_norm": 10.398542570571104, "mean_norm/layer0": 9.950576424598694, "mean_norm/layer1": 9.903380393981934, "mean_norm/layer10": 10.2602379322052, "mean_norm/layer11": 10.531521320343018, "mean_norm/layer12": 10.980621695518494, "mean_norm/layer13": 10.237708628177643, "mean_norm/layer14": 10.592123091220856, "mean_norm/layer15": 10.86921912431717, "mean_norm/layer16": 10.324528396129608, "mean_norm/layer17": 10.772493362426758, "mean_norm/layer18": 10.379202902317047, "mean_norm/layer19": 10.41831624507904, "mean_norm/layer2": 8.757138550281525, "mean_norm/layer20": 10.527169048786163, "mean_norm/layer21": 10.482528150081635, "mean_norm/layer22": 11.343506574630737, "mean_norm/layer23": 11.291179537773132, "mean_norm/layer3": 10.771021962165833, "mean_norm/layer4": 9.77420699596405, "mean_norm/layer5": 11.816980540752411, "mean_norm/layer6": 9.359247148036957, "mean_norm/layer7": 9.812303245067596, "mean_norm/layer8": 10.234733879566193, "mean_norm/layer9": 10.17507654428482, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 8100 }, { "epoch": 3.38, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46344856678145396, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7265894412994385, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.773, "eval_samples_per_second": 20.471, "eval_steps_per_second": 0.68, "step": 8100 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.4, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5544, "max_norm": 30.036163330078125, "max_norm/layer0": 23.137466430664062, "max_norm/layer1": 24.516328811645508, "max_norm/layer10": 26.114761352539062, "max_norm/layer11": 24.583471298217773, "max_norm/layer12": 26.794891357421875, "max_norm/layer13": 23.09189224243164, "max_norm/layer14": 24.96297264099121, "max_norm/layer15": 29.24390983581543, "max_norm/layer16": 24.714712142944336, "max_norm/layer17": 29.043437957763672, "max_norm/layer18": 25.807891845703125, "max_norm/layer19": 25.197919845581055, "max_norm/layer2": 19.644575119018555, "max_norm/layer20": 26.390174865722656, "max_norm/layer21": 25.839521408081055, "max_norm/layer22": 26.697118759155273, "max_norm/layer23": 25.650402069091797, "max_norm/layer3": 24.080507278442383, "max_norm/layer4": 23.73740577697754, "max_norm/layer5": 30.036163330078125, "max_norm/layer6": 20.57171058654785, "max_norm/layer7": 25.5966739654541, "max_norm/layer8": 25.62618637084961, "max_norm/layer9": 25.398679733276367, "mean_norm": 10.409372217953205, "mean_norm/layer0": 9.963123381137848, "mean_norm/layer1": 9.913290679454803, "mean_norm/layer10": 10.270268023014069, "mean_norm/layer11": 10.542797803878784, "mean_norm/layer12": 10.994561910629272, "mean_norm/layer13": 10.248073875904083, "mean_norm/layer14": 10.603521823883057, "mean_norm/layer15": 10.882000625133514, "mean_norm/layer16": 10.334827065467834, "mean_norm/layer17": 10.784078478813171, "mean_norm/layer18": 10.389080286026001, "mean_norm/layer19": 10.428483843803406, "mean_norm/layer2": 8.760785043239594, "mean_norm/layer20": 10.537615478038788, "mean_norm/layer21": 10.492811977863312, "mean_norm/layer22": 11.357585430145264, "mean_norm/layer23": 11.305007696151733, "mean_norm/layer3": 10.784351646900177, "mean_norm/layer4": 9.78234201669693, "mean_norm/layer5": 11.834979832172394, "mean_norm/layer6": 9.365468978881836, "mean_norm/layer7": 9.820427119731903, "mean_norm/layer8": 10.244697272777557, "mean_norm/layer9": 10.184752941131592, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 8150 }, { "epoch": 3.4, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4645639908656908, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7237918376922607, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.9291, "eval_samples_per_second": 20.203, "eval_steps_per_second": 0.671, "step": 8150 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.42, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5709, "max_norm": 30.166780471801758, "max_norm/layer0": 23.243453979492188, "max_norm/layer1": 24.587581634521484, "max_norm/layer10": 26.202739715576172, "max_norm/layer11": 24.643613815307617, "max_norm/layer12": 26.904972076416016, "max_norm/layer13": 23.170438766479492, "max_norm/layer14": 25.052398681640625, "max_norm/layer15": 29.362018585205078, "max_norm/layer16": 24.78993034362793, "max_norm/layer17": 29.15652847290039, "max_norm/layer18": 25.90541648864746, "max_norm/layer19": 25.296329498291016, "max_norm/layer2": 19.711423873901367, "max_norm/layer20": 26.483051300048828, "max_norm/layer21": 25.928726196289062, "max_norm/layer22": 26.79326629638672, "max_norm/layer23": 25.732973098754883, "max_norm/layer3": 24.16873550415039, "max_norm/layer4": 23.828855514526367, "max_norm/layer5": 30.166780471801758, "max_norm/layer6": 20.63398551940918, "max_norm/layer7": 25.68387794494629, "max_norm/layer8": 25.716650009155273, "max_norm/layer9": 25.49351692199707, "mean_norm": 10.420199210445086, "mean_norm/layer0": 9.975629687309265, "mean_norm/layer1": 9.923239886760712, "mean_norm/layer10": 10.280281364917755, "mean_norm/layer11": 10.553914904594421, "mean_norm/layer12": 11.008561134338379, "mean_norm/layer13": 10.25827956199646, "mean_norm/layer14": 10.61497974395752, "mean_norm/layer15": 10.894914627075195, "mean_norm/layer16": 10.345185399055481, "mean_norm/layer17": 10.795701205730438, "mean_norm/layer18": 10.398858368396759, "mean_norm/layer19": 10.43862897157669, "mean_norm/layer2": 8.76432204246521, "mean_norm/layer20": 10.54761826992035, "mean_norm/layer21": 10.503165245056152, "mean_norm/layer22": 11.37176662683487, "mean_norm/layer23": 11.318861424922943, "mean_norm/layer3": 10.797767579555511, "mean_norm/layer4": 9.79049038887024, "mean_norm/layer5": 11.852981925010681, "mean_norm/layer6": 9.371674835681915, "mean_norm/layer7": 9.828672230243683, "mean_norm/layer8": 10.254789173603058, "mean_norm/layer9": 10.19449645280838, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 8200 }, { "epoch": 3.42, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46372032464924984, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7265851497650146, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.9418, "eval_samples_per_second": 20.181, "eval_steps_per_second": 0.67, "step": 8200 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.44, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5516, "max_norm": 30.276281356811523, "max_norm/layer0": 23.351200103759766, "max_norm/layer1": 24.666385650634766, "max_norm/layer10": 26.298505783081055, "max_norm/layer11": 24.71743392944336, "max_norm/layer12": 27.001976013183594, "max_norm/layer13": 23.236825942993164, "max_norm/layer14": 25.13396644592285, "max_norm/layer15": 29.4676513671875, "max_norm/layer16": 24.866540908813477, "max_norm/layer17": 29.276226043701172, "max_norm/layer18": 26.03716278076172, "max_norm/layer19": 25.378047943115234, "max_norm/layer2": 19.76215934753418, "max_norm/layer20": 26.57210922241211, "max_norm/layer21": 26.011999130249023, "max_norm/layer22": 26.882152557373047, "max_norm/layer23": 25.821067810058594, "max_norm/layer3": 24.24490737915039, "max_norm/layer4": 23.920644760131836, "max_norm/layer5": 30.276281356811523, "max_norm/layer6": 20.692121505737305, "max_norm/layer7": 25.77505874633789, "max_norm/layer8": 25.806955337524414, "max_norm/layer9": 25.58926773071289, "mean_norm": 10.430931073923906, "mean_norm/layer0": 9.98804497718811, "mean_norm/layer1": 9.933098196983337, "mean_norm/layer10": 10.290146708488464, "mean_norm/layer11": 10.565122425556183, "mean_norm/layer12": 11.022390842437744, "mean_norm/layer13": 10.268523097038269, "mean_norm/layer14": 10.62632930278778, "mean_norm/layer15": 10.907580077648163, "mean_norm/layer16": 10.35539186000824, "mean_norm/layer17": 10.807102382183075, "mean_norm/layer18": 10.408660113811493, "mean_norm/layer19": 10.448697566986084, "mean_norm/layer2": 8.767856657505035, "mean_norm/layer20": 10.557779371738434, "mean_norm/layer21": 10.513407111167908, "mean_norm/layer22": 11.38557916879654, "mean_norm/layer23": 11.332580626010895, "mean_norm/layer3": 10.811109960079193, "mean_norm/layer4": 9.798513650894165, "mean_norm/layer5": 11.87085086107254, "mean_norm/layer6": 9.377831220626831, "mean_norm/layer7": 9.836784183979034, "mean_norm/layer8": 10.264754116535187, "mean_norm/layer9": 10.204211294651031, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 8250 }, { "epoch": 3.44, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46428006473515776, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7251768112182617, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7806, "eval_samples_per_second": 20.457, "eval_steps_per_second": 0.679, "step": 8250 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.47, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5684, "max_norm": 30.39374351501465, "max_norm/layer0": 23.451919555664062, "max_norm/layer1": 24.738218307495117, "max_norm/layer10": 26.394065856933594, "max_norm/layer11": 24.77541732788086, "max_norm/layer12": 27.105628967285156, "max_norm/layer13": 23.32464027404785, "max_norm/layer14": 25.2191162109375, "max_norm/layer15": 29.590665817260742, "max_norm/layer16": 24.959054946899414, "max_norm/layer17": 29.399641036987305, "max_norm/layer18": 26.127994537353516, "max_norm/layer19": 25.49078941345215, "max_norm/layer2": 19.80423927307129, "max_norm/layer20": 26.659399032592773, "max_norm/layer21": 26.106576919555664, "max_norm/layer22": 26.97296905517578, "max_norm/layer23": 25.90880584716797, "max_norm/layer3": 24.324474334716797, "max_norm/layer4": 24.0111083984375, "max_norm/layer5": 30.39374351501465, "max_norm/layer6": 20.750532150268555, "max_norm/layer7": 25.87520980834961, "max_norm/layer8": 25.891870498657227, "max_norm/layer9": 25.693950653076172, "mean_norm": 10.441620844105879, "mean_norm/layer0": 10.000455558300018, "mean_norm/layer1": 9.942868113517761, "mean_norm/layer10": 10.300001859664917, "mean_norm/layer11": 10.5762220621109, "mean_norm/layer12": 11.036210000514984, "mean_norm/layer13": 10.27873706817627, "mean_norm/layer14": 10.63762879371643, "mean_norm/layer15": 10.920246362686157, "mean_norm/layer16": 10.365561723709106, "mean_norm/layer17": 10.818557620048523, "mean_norm/layer18": 10.418470799922943, "mean_norm/layer19": 10.458708882331848, "mean_norm/layer2": 8.771406590938568, "mean_norm/layer20": 10.567735850811005, "mean_norm/layer21": 10.523515522480011, "mean_norm/layer22": 11.399278342723846, "mean_norm/layer23": 11.346218764781952, "mean_norm/layer3": 10.824534296989441, "mean_norm/layer4": 9.806449353694916, "mean_norm/layer5": 11.888680815696716, "mean_norm/layer6": 9.383990585803986, "mean_norm/layer7": 9.844885289669037, "mean_norm/layer8": 10.274694323539734, "mean_norm/layer9": 10.213841676712036, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 8300 }, { "epoch": 3.47, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46520079661560054, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7237327098846436, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.9328, "eval_samples_per_second": 20.196, "eval_steps_per_second": 0.67, "step": 8300 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.49, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5825, "max_norm": 30.522048950195312, "max_norm/layer0": 23.55970573425293, "max_norm/layer1": 24.81685447692871, "max_norm/layer10": 26.48958396911621, "max_norm/layer11": 24.84947395324707, "max_norm/layer12": 27.182397842407227, "max_norm/layer13": 23.40679168701172, "max_norm/layer14": 25.298507690429688, "max_norm/layer15": 29.69232749938965, "max_norm/layer16": 25.0523624420166, "max_norm/layer17": 29.538833618164062, "max_norm/layer18": 26.200260162353516, "max_norm/layer19": 25.59515380859375, "max_norm/layer2": 19.851430892944336, "max_norm/layer20": 26.742952346801758, "max_norm/layer21": 26.21401596069336, "max_norm/layer22": 27.071521759033203, "max_norm/layer23": 25.991113662719727, "max_norm/layer3": 24.40773582458496, "max_norm/layer4": 24.08420753479004, "max_norm/layer5": 30.522048950195312, "max_norm/layer6": 20.804243087768555, "max_norm/layer7": 25.957096099853516, "max_norm/layer8": 25.9805965423584, "max_norm/layer9": 25.79876708984375, "mean_norm": 10.452224182585875, "mean_norm/layer0": 10.012845158576965, "mean_norm/layer1": 9.95258343219757, "mean_norm/layer10": 10.309782326221466, "mean_norm/layer11": 10.58720487356186, "mean_norm/layer12": 11.049781918525696, "mean_norm/layer13": 10.288818776607513, "mean_norm/layer14": 10.648904502391815, "mean_norm/layer15": 10.932937741279602, "mean_norm/layer16": 10.375604629516602, "mean_norm/layer17": 10.829921543598175, "mean_norm/layer18": 10.428043961524963, "mean_norm/layer19": 10.468553483486176, "mean_norm/layer2": 8.774953544139862, "mean_norm/layer20": 10.577674269676208, "mean_norm/layer21": 10.533466219902039, "mean_norm/layer22": 11.413104712963104, "mean_norm/layer23": 11.359838545322418, "mean_norm/layer3": 10.837815344333649, "mean_norm/layer4": 9.814239382743835, "mean_norm/layer5": 11.906380355358124, "mean_norm/layer6": 9.39007294178009, "mean_norm/layer7": 9.852976441383362, "mean_norm/layer8": 10.284550070762634, "mean_norm/layer9": 10.223326206207275, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 8350 }, { "epoch": 3.49, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4650101604993855, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7208874225616455, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 10.9067, "eval_samples_per_second": 22.096, "eval_steps_per_second": 0.733, "step": 8350 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.51, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5674, "max_norm": 30.639392852783203, "max_norm/layer0": 23.658632278442383, "max_norm/layer1": 24.890296936035156, "max_norm/layer10": 26.574634552001953, "max_norm/layer11": 24.93674659729004, "max_norm/layer12": 27.2740478515625, "max_norm/layer13": 23.50137710571289, "max_norm/layer14": 25.371257781982422, "max_norm/layer15": 29.808671951293945, "max_norm/layer16": 25.12998390197754, "max_norm/layer17": 29.665565490722656, "max_norm/layer18": 26.2768497467041, "max_norm/layer19": 25.701955795288086, "max_norm/layer2": 19.902111053466797, "max_norm/layer20": 26.831134796142578, "max_norm/layer21": 26.28788948059082, "max_norm/layer22": 27.162761688232422, "max_norm/layer23": 26.07558250427246, "max_norm/layer3": 24.493680953979492, "max_norm/layer4": 24.156644821166992, "max_norm/layer5": 30.639392852783203, "max_norm/layer6": 20.861595153808594, "max_norm/layer7": 26.031085968017578, "max_norm/layer8": 26.07181167602539, "max_norm/layer9": 25.8958740234375, "mean_norm": 10.462683290243149, "mean_norm/layer0": 10.02505087852478, "mean_norm/layer1": 9.962117493152618, "mean_norm/layer10": 10.319499015808105, "mean_norm/layer11": 10.598048448562622, "mean_norm/layer12": 11.06323504447937, "mean_norm/layer13": 10.298875629901886, "mean_norm/layer14": 10.660021245479584, "mean_norm/layer15": 10.945443570613861, "mean_norm/layer16": 10.38556182384491, "mean_norm/layer17": 10.84118789434433, "mean_norm/layer18": 10.43755179643631, "mean_norm/layer19": 10.47838807106018, "mean_norm/layer2": 8.778468549251556, "mean_norm/layer20": 10.587294101715088, "mean_norm/layer21": 10.54331248998642, "mean_norm/layer22": 11.42659991979599, "mean_norm/layer23": 11.373156070709229, "mean_norm/layer3": 10.850870013237, "mean_norm/layer4": 9.821917593479156, "mean_norm/layer5": 11.923875868320465, "mean_norm/layer6": 9.39600282907486, "mean_norm/layer7": 9.860944926738739, "mean_norm/layer8": 10.294282972812653, "mean_norm/layer9": 10.23269271850586, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 8400 }, { "epoch": 3.51, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4650669457254921, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.718179702758789, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 10.889, "eval_samples_per_second": 22.132, "eval_steps_per_second": 0.735, "step": 8400 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.53, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5798, "max_norm": 30.766651153564453, "max_norm/layer0": 23.751983642578125, "max_norm/layer1": 24.96283531188965, "max_norm/layer10": 26.6643009185791, "max_norm/layer11": 25.018144607543945, "max_norm/layer12": 27.3858699798584, "max_norm/layer13": 23.57953453063965, "max_norm/layer14": 25.471681594848633, "max_norm/layer15": 29.91374969482422, "max_norm/layer16": 25.209827423095703, "max_norm/layer17": 29.779539108276367, "max_norm/layer18": 26.364397048950195, "max_norm/layer19": 25.807302474975586, "max_norm/layer2": 19.943843841552734, "max_norm/layer20": 26.922224044799805, "max_norm/layer21": 26.374265670776367, "max_norm/layer22": 27.24306869506836, "max_norm/layer23": 26.16399383544922, "max_norm/layer3": 24.571680068969727, "max_norm/layer4": 24.2481689453125, "max_norm/layer5": 30.766651153564453, "max_norm/layer6": 20.909099578857422, "max_norm/layer7": 26.11029624938965, "max_norm/layer8": 26.175079345703125, "max_norm/layer9": 25.993101119995117, "mean_norm": 10.473153608540693, "mean_norm/layer0": 10.037110924720764, "mean_norm/layer1": 9.971767902374268, "mean_norm/layer10": 10.329081892967224, "mean_norm/layer11": 10.608945548534393, "mean_norm/layer12": 11.076784670352936, "mean_norm/layer13": 10.308919906616211, "mean_norm/layer14": 10.671100199222565, "mean_norm/layer15": 10.958038628101349, "mean_norm/layer16": 10.395552039146423, "mean_norm/layer17": 10.852413356304169, "mean_norm/layer18": 10.447036266326904, "mean_norm/layer19": 10.488157510757446, "mean_norm/layer2": 8.781982839107513, "mean_norm/layer20": 10.596912443637848, "mean_norm/layer21": 10.553145587444305, "mean_norm/layer22": 11.439911663532257, "mean_norm/layer23": 11.386568009853363, "mean_norm/layer3": 10.86396187543869, "mean_norm/layer4": 9.82959532737732, "mean_norm/layer5": 11.941483497619629, "mean_norm/layer6": 9.401970863342285, "mean_norm/layer7": 9.869019269943237, "mean_norm/layer8": 10.30410349369049, "mean_norm/layer9": 10.242122888565063, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 8450 }, { "epoch": 3.53, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4649087583099094, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7157468795776367, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.9398, "eval_samples_per_second": 20.185, "eval_steps_per_second": 0.67, "step": 8450 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.55, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5788, "max_norm": 30.9117374420166, "max_norm/layer0": 23.839109420776367, "max_norm/layer1": 25.04669761657715, "max_norm/layer10": 26.760334014892578, "max_norm/layer11": 25.07632827758789, "max_norm/layer12": 27.48368263244629, "max_norm/layer13": 23.673465728759766, "max_norm/layer14": 25.5750675201416, "max_norm/layer15": 30.018980026245117, "max_norm/layer16": 25.29213523864746, "max_norm/layer17": 29.91062355041504, "max_norm/layer18": 26.471200942993164, "max_norm/layer19": 25.893930435180664, "max_norm/layer2": 20.0001220703125, "max_norm/layer20": 27.020864486694336, "max_norm/layer21": 26.478113174438477, "max_norm/layer22": 27.32907485961914, "max_norm/layer23": 26.25127410888672, "max_norm/layer3": 24.64104652404785, "max_norm/layer4": 24.34300994873047, "max_norm/layer5": 30.9117374420166, "max_norm/layer6": 20.962677001953125, "max_norm/layer7": 26.191547393798828, "max_norm/layer8": 26.274858474731445, "max_norm/layer9": 26.109769821166992, "mean_norm": 10.483579012254873, "mean_norm/layer0": 10.04910922050476, "mean_norm/layer1": 9.981406450271606, "mean_norm/layer10": 10.33859497308731, "mean_norm/layer11": 10.619703590869904, "mean_norm/layer12": 11.090156137943268, "mean_norm/layer13": 10.31883031129837, "mean_norm/layer14": 10.682014226913452, "mean_norm/layer15": 10.970479130744934, "mean_norm/layer16": 10.405543386936188, "mean_norm/layer17": 10.863610625267029, "mean_norm/layer18": 10.4564608335495, "mean_norm/layer19": 10.497778236865997, "mean_norm/layer2": 8.785513758659363, "mean_norm/layer20": 10.606768667697906, "mean_norm/layer21": 10.5628901720047, "mean_norm/layer22": 11.453165590763092, "mean_norm/layer23": 11.399942815303802, "mean_norm/layer3": 10.876989305019379, "mean_norm/layer4": 9.837391912937164, "mean_norm/layer5": 11.959004819393158, "mean_norm/layer6": 9.407935559749603, "mean_norm/layer7": 9.877058207988739, "mean_norm/layer8": 10.313934981822968, "mean_norm/layer9": 10.25161337852478, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 8500 }, { "epoch": 3.55, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46567130277476954, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.716278314590454, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.9286, "eval_samples_per_second": 20.203, "eval_steps_per_second": 0.671, "step": 8500 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.57, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.574, "max_norm": 31.035043716430664, "max_norm/layer0": 23.93219757080078, "max_norm/layer1": 25.118915557861328, "max_norm/layer10": 26.85211181640625, "max_norm/layer11": 25.140438079833984, "max_norm/layer12": 27.57324981689453, "max_norm/layer13": 23.7674503326416, "max_norm/layer14": 25.660987854003906, "max_norm/layer15": 30.117841720581055, "max_norm/layer16": 25.384872436523438, "max_norm/layer17": 30.02664566040039, "max_norm/layer18": 26.555728912353516, "max_norm/layer19": 25.99490737915039, "max_norm/layer2": 20.0588436126709, "max_norm/layer20": 27.112516403198242, "max_norm/layer21": 26.563764572143555, "max_norm/layer22": 27.413936614990234, "max_norm/layer23": 26.341724395751953, "max_norm/layer3": 24.70960235595703, "max_norm/layer4": 24.425901412963867, "max_norm/layer5": 31.035043716430664, "max_norm/layer6": 21.027484893798828, "max_norm/layer7": 26.281536102294922, "max_norm/layer8": 26.368459701538086, "max_norm/layer9": 26.20467185974121, "mean_norm": 10.494121707975864, "mean_norm/layer0": 10.061342477798462, "mean_norm/layer1": 9.99113255739212, "mean_norm/layer10": 10.348263144493103, "mean_norm/layer11": 10.630640387535095, "mean_norm/layer12": 11.10374128818512, "mean_norm/layer13": 10.32883608341217, "mean_norm/layer14": 10.693177998065948, "mean_norm/layer15": 10.983099639415741, "mean_norm/layer16": 10.415638208389282, "mean_norm/layer17": 10.874902606010437, "mean_norm/layer18": 10.465932965278625, "mean_norm/layer19": 10.507543802261353, "mean_norm/layer2": 8.789079010486603, "mean_norm/layer20": 10.616671085357666, "mean_norm/layer21": 10.572692036628723, "mean_norm/layer22": 11.466717422008514, "mean_norm/layer23": 11.413405001163483, "mean_norm/layer3": 10.890101253986359, "mean_norm/layer4": 9.845227479934692, "mean_norm/layer5": 11.9767746925354, "mean_norm/layer6": 9.41396027803421, "mean_norm/layer7": 9.885132670402527, "mean_norm/layer8": 10.323809742927551, "mean_norm/layer9": 10.26109915971756, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 8550 }, { "epoch": 3.57, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4657078075629809, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7177693843841553, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7202, "eval_samples_per_second": 20.563, "eval_steps_per_second": 0.683, "step": 8550 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.59, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5612, "max_norm": 31.140310287475586, "max_norm/layer0": 24.02177619934082, "max_norm/layer1": 25.188316345214844, "max_norm/layer10": 26.956527709960938, "max_norm/layer11": 25.21898651123047, "max_norm/layer12": 27.661983489990234, "max_norm/layer13": 23.849395751953125, "max_norm/layer14": 25.733461380004883, "max_norm/layer15": 30.240049362182617, "max_norm/layer16": 25.489137649536133, "max_norm/layer17": 30.150360107421875, "max_norm/layer18": 26.642009735107422, "max_norm/layer19": 26.0812931060791, "max_norm/layer2": 20.112157821655273, "max_norm/layer20": 27.20627212524414, "max_norm/layer21": 26.658498764038086, "max_norm/layer22": 27.516849517822266, "max_norm/layer23": 26.427011489868164, "max_norm/layer3": 24.779708862304688, "max_norm/layer4": 24.51090431213379, "max_norm/layer5": 31.140310287475586, "max_norm/layer6": 21.10075569152832, "max_norm/layer7": 26.379568099975586, "max_norm/layer8": 26.46396827697754, "max_norm/layer9": 26.29374885559082, "mean_norm": 10.504519318540892, "mean_norm/layer0": 10.073370933532715, "mean_norm/layer1": 10.000800788402557, "mean_norm/layer10": 10.357769906520844, "mean_norm/layer11": 10.6414253115654, "mean_norm/layer12": 11.117177963256836, "mean_norm/layer13": 10.33878743648529, "mean_norm/layer14": 10.704220652580261, "mean_norm/layer15": 10.995559275150299, "mean_norm/layer16": 10.425552606582642, "mean_norm/layer17": 10.886011600494385, "mean_norm/layer18": 10.475245594978333, "mean_norm/layer19": 10.51713490486145, "mean_norm/layer2": 8.792496740818024, "mean_norm/layer20": 10.626440286636353, "mean_norm/layer21": 10.582411348819733, "mean_norm/layer22": 11.480081796646118, "mean_norm/layer23": 11.42665684223175, "mean_norm/layer3": 10.903161942958832, "mean_norm/layer4": 9.852953791618347, "mean_norm/layer5": 11.994223237037659, "mean_norm/layer6": 9.419936060905457, "mean_norm/layer7": 9.893079459667206, "mean_norm/layer8": 10.33350384235382, "mean_norm/layer9": 10.270461320877075, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 8600 }, { "epoch": 3.59, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46590655585435403, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7106266021728516, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.9154, "eval_samples_per_second": 20.226, "eval_steps_per_second": 0.671, "step": 8600 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.61, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5816, "max_norm": 31.250791549682617, "max_norm/layer0": 24.110010147094727, "max_norm/layer1": 25.280006408691406, "max_norm/layer10": 27.059661865234375, "max_norm/layer11": 25.282930374145508, "max_norm/layer12": 27.764455795288086, "max_norm/layer13": 23.927961349487305, "max_norm/layer14": 25.809751510620117, "max_norm/layer15": 30.362098693847656, "max_norm/layer16": 25.56882667541504, "max_norm/layer17": 30.28155517578125, "max_norm/layer18": 26.721351623535156, "max_norm/layer19": 26.17807960510254, "max_norm/layer2": 20.16436004638672, "max_norm/layer20": 27.294723510742188, "max_norm/layer21": 26.74715805053711, "max_norm/layer22": 27.608800888061523, "max_norm/layer23": 26.51601219177246, "max_norm/layer3": 24.850908279418945, "max_norm/layer4": 24.58802604675293, "max_norm/layer5": 31.250791549682617, "max_norm/layer6": 21.15802764892578, "max_norm/layer7": 26.47740364074707, "max_norm/layer8": 26.554189682006836, "max_norm/layer9": 26.38273811340332, "mean_norm": 10.515074729919434, "mean_norm/layer0": 10.08557814359665, "mean_norm/layer1": 10.01053923368454, "mean_norm/layer10": 10.367479145526886, "mean_norm/layer11": 10.652198612689972, "mean_norm/layer12": 11.130778849124908, "mean_norm/layer13": 10.348851323127747, "mean_norm/layer14": 10.71534115076065, "mean_norm/layer15": 11.00808185338974, "mean_norm/layer16": 10.435614585876465, "mean_norm/layer17": 10.897213876247406, "mean_norm/layer18": 10.484766364097595, "mean_norm/layer19": 10.527069389820099, "mean_norm/layer2": 8.796098411083221, "mean_norm/layer20": 10.636413216590881, "mean_norm/layer21": 10.592262923717499, "mean_norm/layer22": 11.493712186813354, "mean_norm/layer23": 11.440210998058319, "mean_norm/layer3": 10.916420876979828, "mean_norm/layer4": 9.86082011461258, "mean_norm/layer5": 12.011876881122589, "mean_norm/layer6": 9.425954461097717, "mean_norm/layer7": 9.901139974594116, "mean_norm/layer8": 10.343375980854034, "mean_norm/layer9": 10.27999496459961, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 8650 }, { "epoch": 3.61, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46609313588299, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7121775150299072, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.9234, "eval_samples_per_second": 20.212, "eval_steps_per_second": 0.671, "step": 8650 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.63, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5695, "max_norm": 31.358867645263672, "max_norm/layer0": 24.205951690673828, "max_norm/layer1": 25.37681770324707, "max_norm/layer10": 27.143234252929688, "max_norm/layer11": 25.367061614990234, "max_norm/layer12": 27.863758087158203, "max_norm/layer13": 24.005512237548828, "max_norm/layer14": 25.879533767700195, "max_norm/layer15": 30.467557907104492, "max_norm/layer16": 25.646121978759766, "max_norm/layer17": 30.41017723083496, "max_norm/layer18": 26.787418365478516, "max_norm/layer19": 26.29683494567871, "max_norm/layer2": 20.221500396728516, "max_norm/layer20": 27.37459945678711, "max_norm/layer21": 26.828081130981445, "max_norm/layer22": 27.710824966430664, "max_norm/layer23": 26.605989456176758, "max_norm/layer3": 24.92000961303711, "max_norm/layer4": 24.675378799438477, "max_norm/layer5": 31.358867645263672, "max_norm/layer6": 21.21007537841797, "max_norm/layer7": 26.560998916625977, "max_norm/layer8": 26.642372131347656, "max_norm/layer9": 26.490453720092773, "mean_norm": 10.525502522786459, "mean_norm/layer0": 10.09764415025711, "mean_norm/layer1": 10.020213961601257, "mean_norm/layer10": 10.37711900472641, "mean_norm/layer11": 10.662993669509888, "mean_norm/layer12": 11.144181966781616, "mean_norm/layer13": 10.35890543460846, "mean_norm/layer14": 10.726293087005615, "mean_norm/layer15": 11.02056634426117, "mean_norm/layer16": 10.445514619350433, "mean_norm/layer17": 10.908413589000702, "mean_norm/layer18": 10.49404126405716, "mean_norm/layer19": 10.536761999130249, "mean_norm/layer2": 8.7996466755867, "mean_norm/layer20": 10.646133005619049, "mean_norm/layer21": 10.602025330066681, "mean_norm/layer22": 11.50708258152008, "mean_norm/layer23": 11.453619003295898, "mean_norm/layer3": 10.929427862167358, "mean_norm/layer4": 9.868574559688568, "mean_norm/layer5": 12.029329001903534, "mean_norm/layer6": 9.431976199150085, "mean_norm/layer7": 9.909065783023834, "mean_norm/layer8": 10.353107631206512, "mean_norm/layer9": 10.289423823356628, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 8700 }, { "epoch": 3.63, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46699358732553753, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.709040403366089, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.923, "eval_samples_per_second": 20.213, "eval_steps_per_second": 0.671, "step": 8700 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.65, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5743, "max_norm": 31.462026596069336, "max_norm/layer0": 24.306140899658203, "max_norm/layer1": 25.461463928222656, "max_norm/layer10": 27.22161865234375, "max_norm/layer11": 25.44947624206543, "max_norm/layer12": 27.968080520629883, "max_norm/layer13": 24.1011905670166, "max_norm/layer14": 25.971227645874023, "max_norm/layer15": 30.586713790893555, "max_norm/layer16": 25.736255645751953, "max_norm/layer17": 30.536222457885742, "max_norm/layer18": 26.88282585144043, "max_norm/layer19": 26.426443099975586, "max_norm/layer2": 20.280811309814453, "max_norm/layer20": 27.453838348388672, "max_norm/layer21": 26.928016662597656, "max_norm/layer22": 27.80914306640625, "max_norm/layer23": 26.693340301513672, "max_norm/layer3": 24.99188804626465, "max_norm/layer4": 24.771135330200195, "max_norm/layer5": 31.462026596069336, "max_norm/layer6": 21.271432876586914, "max_norm/layer7": 26.657981872558594, "max_norm/layer8": 26.73614501953125, "max_norm/layer9": 26.60494613647461, "mean_norm": 10.53589997192224, "mean_norm/layer0": 10.109680235385895, "mean_norm/layer1": 10.029725313186646, "mean_norm/layer10": 10.386717557907104, "mean_norm/layer11": 10.673824787139893, "mean_norm/layer12": 11.15762722492218, "mean_norm/layer13": 10.36895900964737, "mean_norm/layer14": 10.7372505068779, "mean_norm/layer15": 11.032996237277985, "mean_norm/layer16": 10.455421268939972, "mean_norm/layer17": 10.91942673921585, "mean_norm/layer18": 10.503340184688568, "mean_norm/layer19": 10.546266198158264, "mean_norm/layer2": 8.803168833255768, "mean_norm/layer20": 10.655834794044495, "mean_norm/layer21": 10.611751914024353, "mean_norm/layer22": 11.520513951778412, "mean_norm/layer23": 11.466938018798828, "mean_norm/layer3": 10.942326188087463, "mean_norm/layer4": 9.876272022724152, "mean_norm/layer5": 12.046761870384216, "mean_norm/layer6": 9.438043534755707, "mean_norm/layer7": 9.917055368423462, "mean_norm/layer8": 10.362797379493713, "mean_norm/layer9": 10.298900187015533, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 8750 }, { "epoch": 3.65, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4673708034703885, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7044708728790283, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8474, "eval_samples_per_second": 20.342, "eval_steps_per_second": 0.675, "step": 8750 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.67, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5789, "max_norm": 31.572891235351562, "max_norm/layer0": 24.410261154174805, "max_norm/layer1": 25.558263778686523, "max_norm/layer10": 27.304840087890625, "max_norm/layer11": 25.51268196105957, "max_norm/layer12": 28.05234146118164, "max_norm/layer13": 24.20308494567871, "max_norm/layer14": 26.0477352142334, "max_norm/layer15": 30.70371437072754, "max_norm/layer16": 25.83902931213379, "max_norm/layer17": 30.648099899291992, "max_norm/layer18": 27.012645721435547, "max_norm/layer19": 26.52737808227539, "max_norm/layer2": 20.334718704223633, "max_norm/layer20": 27.539426803588867, "max_norm/layer21": 27.018211364746094, "max_norm/layer22": 27.9110107421875, "max_norm/layer23": 26.7803955078125, "max_norm/layer3": 25.054349899291992, "max_norm/layer4": 24.855287551879883, "max_norm/layer5": 31.572891235351562, "max_norm/layer6": 21.333072662353516, "max_norm/layer7": 26.76139259338379, "max_norm/layer8": 26.838417053222656, "max_norm/layer9": 26.697357177734375, "mean_norm": 10.5463310405612, "mean_norm/layer0": 10.121755361557007, "mean_norm/layer1": 10.039315283298492, "mean_norm/layer10": 10.396234333515167, "mean_norm/layer11": 10.684642255306244, "mean_norm/layer12": 11.171061992645264, "mean_norm/layer13": 10.37897139787674, "mean_norm/layer14": 10.748344361782074, "mean_norm/layer15": 11.045448780059814, "mean_norm/layer16": 10.465394139289856, "mean_norm/layer17": 10.930562853813171, "mean_norm/layer18": 10.512667119503021, "mean_norm/layer19": 10.55586314201355, "mean_norm/layer2": 8.806701242923737, "mean_norm/layer20": 10.665653467178345, "mean_norm/layer21": 10.621645450592041, "mean_norm/layer22": 11.533875703811646, "mean_norm/layer23": 11.480299174785614, "mean_norm/layer3": 10.955307066440582, "mean_norm/layer4": 9.88407689332962, "mean_norm/layer5": 12.064229130744934, "mean_norm/layer6": 9.444064617156982, "mean_norm/layer7": 9.92504996061325, "mean_norm/layer8": 10.372445940971375, "mean_norm/layer9": 10.308335304260254, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 8800 }, { "epoch": 3.67, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4667907829465854, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7064690589904785, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.587, "eval_samples_per_second": 20.799, "eval_steps_per_second": 0.69, "step": 8800 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.7, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5744, "max_norm": 31.6871337890625, "max_norm/layer0": 24.510038375854492, "max_norm/layer1": 25.655925750732422, "max_norm/layer10": 27.37701988220215, "max_norm/layer11": 25.585721969604492, "max_norm/layer12": 28.144187927246094, "max_norm/layer13": 24.291133880615234, "max_norm/layer14": 26.127349853515625, "max_norm/layer15": 30.831226348876953, "max_norm/layer16": 25.930320739746094, "max_norm/layer17": 30.755409240722656, "max_norm/layer18": 27.11887550354004, "max_norm/layer19": 26.618364334106445, "max_norm/layer2": 20.38463020324707, "max_norm/layer20": 27.650087356567383, "max_norm/layer21": 27.109182357788086, "max_norm/layer22": 28.00884437561035, "max_norm/layer23": 26.86437225341797, "max_norm/layer3": 25.138376235961914, "max_norm/layer4": 24.935468673706055, "max_norm/layer5": 31.6871337890625, "max_norm/layer6": 21.40496253967285, "max_norm/layer7": 26.854114532470703, "max_norm/layer8": 26.91637420654297, "max_norm/layer9": 26.789180755615234, "mean_norm": 10.556625217199326, "mean_norm/layer0": 10.13366448879242, "mean_norm/layer1": 10.048774302005768, "mean_norm/layer10": 10.405665278434753, "mean_norm/layer11": 10.695261061191559, "mean_norm/layer12": 11.184338688850403, "mean_norm/layer13": 10.388884425163269, "mean_norm/layer14": 10.759207367897034, "mean_norm/layer15": 11.05769032239914, "mean_norm/layer16": 10.475219130516052, "mean_norm/layer17": 10.94150424003601, "mean_norm/layer18": 10.5219966173172, "mean_norm/layer19": 10.565406024456024, "mean_norm/layer2": 8.810097455978394, "mean_norm/layer20": 10.675190091133118, "mean_norm/layer21": 10.631307899951935, "mean_norm/layer22": 11.547064244747162, "mean_norm/layer23": 11.493385910987854, "mean_norm/layer3": 10.968357741832733, "mean_norm/layer4": 9.891835868358612, "mean_norm/layer5": 12.081561923027039, "mean_norm/layer6": 9.449971437454224, "mean_norm/layer7": 9.932962834835052, "mean_norm/layer8": 10.38201367855072, "mean_norm/layer9": 10.31764417886734, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 8850 }, { "epoch": 3.7, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46575242452635035, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7084460258483887, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 10.8044, "eval_samples_per_second": 22.306, "eval_steps_per_second": 0.74, "step": 8850 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.72, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5773, "max_norm": 31.805294036865234, "max_norm/layer0": 24.599546432495117, "max_norm/layer1": 25.76319122314453, "max_norm/layer10": 27.449440002441406, "max_norm/layer11": 25.655227661132812, "max_norm/layer12": 28.233400344848633, "max_norm/layer13": 24.394102096557617, "max_norm/layer14": 26.187408447265625, "max_norm/layer15": 30.92896270751953, "max_norm/layer16": 26.01325035095215, "max_norm/layer17": 30.859031677246094, "max_norm/layer18": 27.204809188842773, "max_norm/layer19": 26.70510482788086, "max_norm/layer2": 20.445926666259766, "max_norm/layer20": 27.740930557250977, "max_norm/layer21": 27.208942413330078, "max_norm/layer22": 28.095291137695312, "max_norm/layer23": 26.942819595336914, "max_norm/layer3": 25.220661163330078, "max_norm/layer4": 25.003028869628906, "max_norm/layer5": 31.805294036865234, "max_norm/layer6": 21.47049903869629, "max_norm/layer7": 26.94700813293457, "max_norm/layer8": 27.007118225097656, "max_norm/layer9": 26.882286071777344, "mean_norm": 10.566929931441942, "mean_norm/layer0": 10.145540177822113, "mean_norm/layer1": 10.058104574680328, "mean_norm/layer10": 10.41511994600296, "mean_norm/layer11": 10.705998122692108, "mean_norm/layer12": 11.197706997394562, "mean_norm/layer13": 10.398730218410492, "mean_norm/layer14": 10.770055413246155, "mean_norm/layer15": 11.06999284029007, "mean_norm/layer16": 10.485083758831024, "mean_norm/layer17": 10.9524467587471, "mean_norm/layer18": 10.53134435415268, "mean_norm/layer19": 10.57489550113678, "mean_norm/layer2": 8.813579618930817, "mean_norm/layer20": 10.684813797473907, "mean_norm/layer21": 10.640975952148438, "mean_norm/layer22": 11.560323774814606, "mean_norm/layer23": 11.50652539730072, "mean_norm/layer3": 10.9813032746315, "mean_norm/layer4": 9.899572908878326, "mean_norm/layer5": 12.098863184452057, "mean_norm/layer6": 9.455974757671356, "mean_norm/layer7": 9.940803170204163, "mean_norm/layer8": 10.391590774059296, "mean_norm/layer9": 10.32697308063507, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 8900 }, { "epoch": 3.72, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46607691153267383, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.708861827850342, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8238, "eval_samples_per_second": 20.383, "eval_steps_per_second": 0.677, "step": 8900 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.74, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5772, "max_norm": 31.916152954101562, "max_norm/layer0": 24.676496505737305, "max_norm/layer1": 25.85756492614746, "max_norm/layer10": 27.528053283691406, "max_norm/layer11": 25.73573112487793, "max_norm/layer12": 28.318124771118164, "max_norm/layer13": 24.479642868041992, "max_norm/layer14": 26.248197555541992, "max_norm/layer15": 31.052705764770508, "max_norm/layer16": 26.09161376953125, "max_norm/layer17": 30.966751098632812, "max_norm/layer18": 27.3068790435791, "max_norm/layer19": 26.7965145111084, "max_norm/layer2": 20.522724151611328, "max_norm/layer20": 27.823123931884766, "max_norm/layer21": 27.323970794677734, "max_norm/layer22": 28.17957878112793, "max_norm/layer23": 27.034547805786133, "max_norm/layer3": 25.299671173095703, "max_norm/layer4": 25.082792282104492, "max_norm/layer5": 31.916152954101562, "max_norm/layer6": 21.534683227539062, "max_norm/layer7": 27.028034210205078, "max_norm/layer8": 27.088815689086914, "max_norm/layer9": 26.969919204711914, "mean_norm": 10.577225059270859, "mean_norm/layer0": 10.157378554344177, "mean_norm/layer1": 10.067561268806458, "mean_norm/layer10": 10.424581110477448, "mean_norm/layer11": 10.716570019721985, "mean_norm/layer12": 11.210873186588287, "mean_norm/layer13": 10.408523380756378, "mean_norm/layer14": 10.78095543384552, "mean_norm/layer15": 11.082448303699493, "mean_norm/layer16": 10.494913518428802, "mean_norm/layer17": 10.963443398475647, "mean_norm/layer18": 10.540624141693115, "mean_norm/layer19": 10.584456026554108, "mean_norm/layer2": 8.81709498167038, "mean_norm/layer20": 10.694341719150543, "mean_norm/layer21": 10.650606751441956, "mean_norm/layer22": 11.573448956012726, "mean_norm/layer23": 11.51974767446518, "mean_norm/layer3": 10.994216620922089, "mean_norm/layer4": 9.90748655796051, "mean_norm/layer5": 12.11613380908966, "mean_norm/layer6": 9.461788892745972, "mean_norm/layer7": 9.948690056800842, "mean_norm/layer8": 10.401232063770294, "mean_norm/layer9": 10.33628499507904, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 8950 }, { "epoch": 3.74, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4669814190628004, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7066380977630615, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8434, "eval_samples_per_second": 20.349, "eval_steps_per_second": 0.675, "step": 8950 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.76, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5866, "max_norm": 32.025630950927734, "max_norm/layer0": 24.762939453125, "max_norm/layer1": 25.960861206054688, "max_norm/layer10": 27.613296508789062, "max_norm/layer11": 25.807106018066406, "max_norm/layer12": 28.428152084350586, "max_norm/layer13": 24.579200744628906, "max_norm/layer14": 26.320199966430664, "max_norm/layer15": 31.175045013427734, "max_norm/layer16": 26.178552627563477, "max_norm/layer17": 31.0894832611084, "max_norm/layer18": 27.412567138671875, "max_norm/layer19": 26.8818359375, "max_norm/layer2": 20.595802307128906, "max_norm/layer20": 27.916038513183594, "max_norm/layer21": 27.415224075317383, "max_norm/layer22": 28.27640151977539, "max_norm/layer23": 27.122173309326172, "max_norm/layer3": 25.38041877746582, "max_norm/layer4": 25.15086555480957, "max_norm/layer5": 32.025630950927734, "max_norm/layer6": 21.594274520874023, "max_norm/layer7": 27.11809730529785, "max_norm/layer8": 27.185285568237305, "max_norm/layer9": 27.044723510742188, "mean_norm": 10.587412876387438, "mean_norm/layer0": 10.168988108634949, "mean_norm/layer1": 10.076943039894104, "mean_norm/layer10": 10.433831512928009, "mean_norm/layer11": 10.72713315486908, "mean_norm/layer12": 11.22397780418396, "mean_norm/layer13": 10.418285012245178, "mean_norm/layer14": 10.791641414165497, "mean_norm/layer15": 11.094760477542877, "mean_norm/layer16": 10.504680275917053, "mean_norm/layer17": 10.974333047866821, "mean_norm/layer18": 10.549786627292633, "mean_norm/layer19": 10.594055414199829, "mean_norm/layer2": 8.820539593696594, "mean_norm/layer20": 10.703791201114655, "mean_norm/layer21": 10.660218596458435, "mean_norm/layer22": 11.586527645587921, "mean_norm/layer23": 11.532706141471863, "mean_norm/layer3": 11.007036626338959, "mean_norm/layer4": 9.915196359157562, "mean_norm/layer5": 12.133186936378479, "mean_norm/layer6": 9.467587530612946, "mean_norm/layer7": 9.95652425289154, "mean_norm/layer8": 10.41076546907425, "mean_norm/layer9": 10.345412790775299, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 9000 }, { "epoch": 3.76, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46787375833018985, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7035961151123047, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8396, "eval_samples_per_second": 20.355, "eval_steps_per_second": 0.676, "step": 9000 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.78, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5766, "max_norm": 32.134735107421875, "max_norm/layer0": 24.84881019592285, "max_norm/layer1": 26.05401611328125, "max_norm/layer10": 27.689804077148438, "max_norm/layer11": 25.87973976135254, "max_norm/layer12": 28.52071762084961, "max_norm/layer13": 24.691492080688477, "max_norm/layer14": 26.403806686401367, "max_norm/layer15": 31.284221649169922, "max_norm/layer16": 26.256942749023438, "max_norm/layer17": 31.221664428710938, "max_norm/layer18": 27.5086612701416, "max_norm/layer19": 26.977436065673828, "max_norm/layer2": 20.662620544433594, "max_norm/layer20": 28.005910873413086, "max_norm/layer21": 27.506736755371094, "max_norm/layer22": 28.381319046020508, "max_norm/layer23": 27.205909729003906, "max_norm/layer3": 25.46193504333496, "max_norm/layer4": 25.2278995513916, "max_norm/layer5": 32.134735107421875, "max_norm/layer6": 21.648170471191406, "max_norm/layer7": 27.21436309814453, "max_norm/layer8": 27.268877029418945, "max_norm/layer9": 27.110942840576172, "mean_norm": 10.597499750554562, "mean_norm/layer0": 10.180612981319427, "mean_norm/layer1": 10.086312234401703, "mean_norm/layer10": 10.443076193332672, "mean_norm/layer11": 10.737610340118408, "mean_norm/layer12": 11.236975133419037, "mean_norm/layer13": 10.427858173847198, "mean_norm/layer14": 10.802227020263672, "mean_norm/layer15": 11.106768071651459, "mean_norm/layer16": 10.514285862445831, "mean_norm/layer17": 10.985120475292206, "mean_norm/layer18": 10.558781325817108, "mean_norm/layer19": 10.603352129459381, "mean_norm/layer2": 8.823948740959167, "mean_norm/layer20": 10.713205635547638, "mean_norm/layer21": 10.66967099905014, "mean_norm/layer22": 11.59945923089981, "mean_norm/layer23": 11.545632243156433, "mean_norm/layer3": 11.019707977771759, "mean_norm/layer4": 9.9228515625, "mean_norm/layer5": 12.150153994560242, "mean_norm/layer6": 9.473384976387024, "mean_norm/layer7": 9.96427607536316, "mean_norm/layer8": 10.420209109783173, "mean_norm/layer9": 10.35451352596283, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 9050 }, { "epoch": 3.78, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46858357365652237, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7019236087799072, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8097, "eval_samples_per_second": 20.407, "eval_steps_per_second": 0.677, "step": 9050 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.8, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5811, "max_norm": 32.24896240234375, "max_norm/layer0": 24.925283432006836, "max_norm/layer1": 26.151309967041016, "max_norm/layer10": 27.78043556213379, "max_norm/layer11": 25.97683334350586, "max_norm/layer12": 28.626747131347656, "max_norm/layer13": 24.789648056030273, "max_norm/layer14": 26.49995231628418, "max_norm/layer15": 31.411869049072266, "max_norm/layer16": 26.331775665283203, "max_norm/layer17": 31.348556518554688, "max_norm/layer18": 27.602380752563477, "max_norm/layer19": 27.07625389099121, "max_norm/layer2": 20.733642578125, "max_norm/layer20": 28.101778030395508, "max_norm/layer21": 27.597261428833008, "max_norm/layer22": 28.473896026611328, "max_norm/layer23": 27.283172607421875, "max_norm/layer3": 25.54083251953125, "max_norm/layer4": 25.305072784423828, "max_norm/layer5": 32.24896240234375, "max_norm/layer6": 21.698518753051758, "max_norm/layer7": 27.31633758544922, "max_norm/layer8": 27.362085342407227, "max_norm/layer9": 27.174236297607422, "mean_norm": 10.60761951158444, "mean_norm/layer0": 10.192138016223907, "mean_norm/layer1": 10.095690608024597, "mean_norm/layer10": 10.45243376493454, "mean_norm/layer11": 10.748098969459534, "mean_norm/layer12": 11.250001728534698, "mean_norm/layer13": 10.4375701546669, "mean_norm/layer14": 10.812869429588318, "mean_norm/layer15": 11.118857681751251, "mean_norm/layer16": 10.523910284042358, "mean_norm/layer17": 10.995957911014557, "mean_norm/layer18": 10.567832112312317, "mean_norm/layer19": 10.61269599199295, "mean_norm/layer2": 8.82736986875534, "mean_norm/layer20": 10.722554564476013, "mean_norm/layer21": 10.679236650466919, "mean_norm/layer22": 11.612319529056549, "mean_norm/layer23": 11.558498978614807, "mean_norm/layer3": 11.032294690608978, "mean_norm/layer4": 9.93044263124466, "mean_norm/layer5": 12.167267978191376, "mean_norm/layer6": 9.479266583919525, "mean_norm/layer7": 9.972204864025116, "mean_norm/layer8": 10.429711878299713, "mean_norm/layer9": 10.363643407821655, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 9100 }, { "epoch": 3.8, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4681252357600905, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.6967613697052, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8279, "eval_samples_per_second": 20.376, "eval_steps_per_second": 0.676, "step": 9100 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.82, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5825, "max_norm": 32.35498046875, "max_norm/layer0": 25.00909996032715, "max_norm/layer1": 26.24652862548828, "max_norm/layer10": 27.876937866210938, "max_norm/layer11": 26.062362670898438, "max_norm/layer12": 28.732330322265625, "max_norm/layer13": 24.885143280029297, "max_norm/layer14": 26.589519500732422, "max_norm/layer15": 31.518461227416992, "max_norm/layer16": 26.398515701293945, "max_norm/layer17": 31.479341506958008, "max_norm/layer18": 27.692447662353516, "max_norm/layer19": 27.19039535522461, "max_norm/layer2": 20.811538696289062, "max_norm/layer20": 28.179485321044922, "max_norm/layer21": 27.66974639892578, "max_norm/layer22": 28.55803108215332, "max_norm/layer23": 27.369035720825195, "max_norm/layer3": 25.627965927124023, "max_norm/layer4": 25.377857208251953, "max_norm/layer5": 32.35498046875, "max_norm/layer6": 21.744564056396484, "max_norm/layer7": 27.417688369750977, "max_norm/layer8": 27.45230484008789, "max_norm/layer9": 27.24327278137207, "mean_norm": 10.617767485479513, "mean_norm/layer0": 10.20370638370514, "mean_norm/layer1": 10.105073094367981, "mean_norm/layer10": 10.461777687072754, "mean_norm/layer11": 10.758564233779907, "mean_norm/layer12": 11.263149619102478, "mean_norm/layer13": 10.447303175926208, "mean_norm/layer14": 10.823521196842194, "mean_norm/layer15": 11.131090462207794, "mean_norm/layer16": 10.533623218536377, "mean_norm/layer17": 11.006788909435272, "mean_norm/layer18": 10.576985120773315, "mean_norm/layer19": 10.621982991695404, "mean_norm/layer2": 8.830790042877197, "mean_norm/layer20": 10.73173063993454, "mean_norm/layer21": 10.688687920570374, "mean_norm/layer22": 11.625361859798431, "mean_norm/layer23": 11.57146829366684, "mean_norm/layer3": 11.044941544532776, "mean_norm/layer4": 9.938095211982727, "mean_norm/layer5": 12.18439656496048, "mean_norm/layer6": 9.485150754451752, "mean_norm/layer7": 9.980055332183838, "mean_norm/layer8": 10.43933492898941, "mean_norm/layer9": 10.372840464115143, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 9150 }, { "epoch": 3.82, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4689972945895848, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.69665265083313, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8286, "eval_samples_per_second": 20.374, "eval_steps_per_second": 0.676, "step": 9150 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.84, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.58, "max_norm": 32.470787048339844, "max_norm/layer0": 25.096399307250977, "max_norm/layer1": 26.337860107421875, "max_norm/layer10": 27.961523056030273, "max_norm/layer11": 26.16880989074707, "max_norm/layer12": 28.851654052734375, "max_norm/layer13": 24.98517608642578, "max_norm/layer14": 26.683137893676758, "max_norm/layer15": 31.63360023498535, "max_norm/layer16": 26.46404457092285, "max_norm/layer17": 31.591623306274414, "max_norm/layer18": 27.78776741027832, "max_norm/layer19": 27.291912078857422, "max_norm/layer2": 20.879919052124023, "max_norm/layer20": 28.259227752685547, "max_norm/layer21": 27.76218605041504, "max_norm/layer22": 28.638896942138672, "max_norm/layer23": 27.45287322998047, "max_norm/layer3": 25.71695899963379, "max_norm/layer4": 25.455402374267578, "max_norm/layer5": 32.470787048339844, "max_norm/layer6": 21.793964385986328, "max_norm/layer7": 27.533058166503906, "max_norm/layer8": 27.53644561767578, "max_norm/layer9": 27.302696228027344, "mean_norm": 10.627832487225533, "mean_norm/layer0": 10.215189158916473, "mean_norm/layer1": 10.114474654197693, "mean_norm/layer10": 10.471054553985596, "mean_norm/layer11": 10.768976330757141, "mean_norm/layer12": 11.276058495044708, "mean_norm/layer13": 10.456969678401947, "mean_norm/layer14": 10.834083795547485, "mean_norm/layer15": 11.143160045146942, "mean_norm/layer16": 10.543258905410767, "mean_norm/layer17": 11.017536640167236, "mean_norm/layer18": 10.586021959781647, "mean_norm/layer19": 10.631254851818085, "mean_norm/layer2": 8.834143280982971, "mean_norm/layer20": 10.741076946258545, "mean_norm/layer21": 10.698038101196289, "mean_norm/layer22": 11.63832575082779, "mean_norm/layer23": 11.584293246269226, "mean_norm/layer3": 11.057526648044586, "mean_norm/layer4": 9.945752322673798, "mean_norm/layer5": 12.201387524604797, "mean_norm/layer6": 9.490907371044159, "mean_norm/layer7": 9.987753689289093, "mean_norm/layer8": 10.448831021785736, "mean_norm/layer9": 10.38190472126007, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 9200 }, { "epoch": 3.84, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4678656461550318, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.699800729751587, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6274, "eval_samples_per_second": 20.727, "eval_steps_per_second": 0.688, "step": 9200 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.86, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5811, "max_norm": 32.58055877685547, "max_norm/layer0": 25.184913635253906, "max_norm/layer1": 26.429561614990234, "max_norm/layer10": 28.046606063842773, "max_norm/layer11": 26.280040740966797, "max_norm/layer12": 28.957191467285156, "max_norm/layer13": 25.079774856567383, "max_norm/layer14": 26.769201278686523, "max_norm/layer15": 31.73074722290039, "max_norm/layer16": 26.54261589050293, "max_norm/layer17": 31.711532592773438, "max_norm/layer18": 27.88140869140625, "max_norm/layer19": 27.393001556396484, "max_norm/layer2": 20.94183921813965, "max_norm/layer20": 28.350820541381836, "max_norm/layer21": 27.87078285217285, "max_norm/layer22": 28.729032516479492, "max_norm/layer23": 27.542428970336914, "max_norm/layer3": 25.806852340698242, "max_norm/layer4": 25.527923583984375, "max_norm/layer5": 32.58055877685547, "max_norm/layer6": 21.839183807373047, "max_norm/layer7": 27.622976303100586, "max_norm/layer8": 27.621929168701172, "max_norm/layer9": 27.380239486694336, "mean_norm": 10.637928095956644, "mean_norm/layer0": 10.226729273796082, "mean_norm/layer1": 10.123919010162354, "mean_norm/layer10": 10.480370283126831, "mean_norm/layer11": 10.779435157775879, "mean_norm/layer12": 11.289127767086029, "mean_norm/layer13": 10.466708064079285, "mean_norm/layer14": 10.844647407531738, "mean_norm/layer15": 11.155323445796967, "mean_norm/layer16": 10.55289614200592, "mean_norm/layer17": 11.028343617916107, "mean_norm/layer18": 10.595082998275757, "mean_norm/layer19": 10.640502452850342, "mean_norm/layer2": 8.8375204205513, "mean_norm/layer20": 10.750492691993713, "mean_norm/layer21": 10.707438945770264, "mean_norm/layer22": 11.651351392269135, "mean_norm/layer23": 11.597171068191528, "mean_norm/layer3": 11.070042908191681, "mean_norm/layer4": 9.953387081623077, "mean_norm/layer5": 12.218364238739014, "mean_norm/layer6": 9.496791005134583, "mean_norm/layer7": 9.995419442653656, "mean_norm/layer8": 10.458230197429657, "mean_norm/layer9": 10.390979290008545, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 9250 }, { "epoch": 3.86, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46845783494157206, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.69732403755188, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 10.7995, "eval_samples_per_second": 22.316, "eval_steps_per_second": 0.741, "step": 9250 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.88, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5798, "max_norm": 32.68303298950195, "max_norm/layer0": 25.272388458251953, "max_norm/layer1": 26.51814079284668, "max_norm/layer10": 28.143573760986328, "max_norm/layer11": 26.36440658569336, "max_norm/layer12": 29.06740379333496, "max_norm/layer13": 25.197477340698242, "max_norm/layer14": 26.863147735595703, "max_norm/layer15": 31.821640014648438, "max_norm/layer16": 26.632102966308594, "max_norm/layer17": 31.83808708190918, "max_norm/layer18": 27.988380432128906, "max_norm/layer19": 27.489473342895508, "max_norm/layer2": 21.011850357055664, "max_norm/layer20": 28.4365291595459, "max_norm/layer21": 27.981365203857422, "max_norm/layer22": 28.814743041992188, "max_norm/layer23": 27.636215209960938, "max_norm/layer3": 25.881065368652344, "max_norm/layer4": 25.616458892822266, "max_norm/layer5": 32.68303298950195, "max_norm/layer6": 21.897836685180664, "max_norm/layer7": 27.713808059692383, "max_norm/layer8": 27.703105926513672, "max_norm/layer9": 27.458404541015625, "mean_norm": 10.647937004764875, "mean_norm/layer0": 10.238056540489197, "mean_norm/layer1": 10.133143305778503, "mean_norm/layer10": 10.489564597606659, "mean_norm/layer11": 10.789824903011322, "mean_norm/layer12": 11.302159667015076, "mean_norm/layer13": 10.476322174072266, "mean_norm/layer14": 10.855113446712494, "mean_norm/layer15": 11.167461931705475, "mean_norm/layer16": 10.562495648860931, "mean_norm/layer17": 11.03900271654129, "mean_norm/layer18": 10.604086875915527, "mean_norm/layer19": 10.649737179279327, "mean_norm/layer2": 8.840841054916382, "mean_norm/layer20": 10.759805142879486, "mean_norm/layer21": 10.716701686382294, "mean_norm/layer22": 11.664154350757599, "mean_norm/layer23": 11.609936714172363, "mean_norm/layer3": 11.082544147968292, "mean_norm/layer4": 9.9610356092453, "mean_norm/layer5": 12.235257029533386, "mean_norm/layer6": 9.502565085887909, "mean_norm/layer7": 10.003019213676453, "mean_norm/layer8": 10.467623889446259, "mean_norm/layer9": 10.400035202503204, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 9300 }, { "epoch": 3.88, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46830775970114746, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7002856731414795, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 10.8184, "eval_samples_per_second": 22.277, "eval_steps_per_second": 0.739, "step": 9300 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.9, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5664, "max_norm": 32.782840728759766, "max_norm/layer0": 25.365907669067383, "max_norm/layer1": 26.609689712524414, "max_norm/layer10": 28.237533569335938, "max_norm/layer11": 26.454559326171875, "max_norm/layer12": 29.165164947509766, "max_norm/layer13": 25.313295364379883, "max_norm/layer14": 26.973520278930664, "max_norm/layer15": 31.91727066040039, "max_norm/layer16": 26.71632194519043, "max_norm/layer17": 31.9581241607666, "max_norm/layer18": 28.106477737426758, "max_norm/layer19": 27.586517333984375, "max_norm/layer2": 21.090667724609375, "max_norm/layer20": 28.518213272094727, "max_norm/layer21": 28.0922794342041, "max_norm/layer22": 28.909934997558594, "max_norm/layer23": 27.714889526367188, "max_norm/layer3": 25.95438575744629, "max_norm/layer4": 25.699705123901367, "max_norm/layer5": 32.782840728759766, "max_norm/layer6": 21.94924545288086, "max_norm/layer7": 27.81015968322754, "max_norm/layer8": 27.77658462524414, "max_norm/layer9": 27.53354835510254, "mean_norm": 10.658011309802532, "mean_norm/layer0": 10.24942147731781, "mean_norm/layer1": 10.14245593547821, "mean_norm/layer10": 10.498845994472504, "mean_norm/layer11": 10.800289332866669, "mean_norm/layer12": 11.315202176570892, "mean_norm/layer13": 10.485957622528076, "mean_norm/layer14": 10.865731239318848, "mean_norm/layer15": 11.179639279842377, "mean_norm/layer16": 10.572109937667847, "mean_norm/layer17": 11.049724102020264, "mean_norm/layer18": 10.613103151321411, "mean_norm/layer19": 10.658956408500671, "mean_norm/layer2": 8.844276249408722, "mean_norm/layer20": 10.769253730773926, "mean_norm/layer21": 10.72613674402237, "mean_norm/layer22": 11.676981389522552, "mean_norm/layer23": 11.622842133045197, "mean_norm/layer3": 11.095019221305847, "mean_norm/layer4": 9.96867686510086, "mean_norm/layer5": 12.25225579738617, "mean_norm/layer6": 9.508372902870178, "mean_norm/layer7": 10.010667264461517, "mean_norm/layer8": 10.477143466472626, "mean_norm/layer9": 10.40920901298523, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 9350 }, { "epoch": 3.9, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4693461181213825, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.6948671340942383, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8372, "eval_samples_per_second": 20.36, "eval_steps_per_second": 0.676, "step": 9350 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.92, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5755, "max_norm": 32.886863708496094, "max_norm/layer0": 25.44892120361328, "max_norm/layer1": 26.69940757751465, "max_norm/layer10": 28.33182144165039, "max_norm/layer11": 26.536706924438477, "max_norm/layer12": 29.27495002746582, "max_norm/layer13": 25.407133102416992, "max_norm/layer14": 27.068056106567383, "max_norm/layer15": 32.01877975463867, "max_norm/layer16": 26.809919357299805, "max_norm/layer17": 32.068660736083984, "max_norm/layer18": 28.212785720825195, "max_norm/layer19": 27.692922592163086, "max_norm/layer2": 21.16015625, "max_norm/layer20": 28.613033294677734, "max_norm/layer21": 28.182695388793945, "max_norm/layer22": 29.009483337402344, "max_norm/layer23": 27.800437927246094, "max_norm/layer3": 26.028907775878906, "max_norm/layer4": 25.79058837890625, "max_norm/layer5": 32.886863708496094, "max_norm/layer6": 22.01177978515625, "max_norm/layer7": 27.899147033691406, "max_norm/layer8": 27.851360321044922, "max_norm/layer9": 27.61525535583496, "mean_norm": 10.668005446592966, "mean_norm/layer0": 10.260759949684143, "mean_norm/layer1": 10.15172153711319, "mean_norm/layer10": 10.508157014846802, "mean_norm/layer11": 10.810645937919617, "mean_norm/layer12": 11.328147649765015, "mean_norm/layer13": 10.495525300502777, "mean_norm/layer14": 10.876251876354218, "mean_norm/layer15": 11.191632449626923, "mean_norm/layer16": 10.58162671327591, "mean_norm/layer17": 11.06039971113205, "mean_norm/layer18": 10.622076153755188, "mean_norm/layer19": 10.668111145496368, "mean_norm/layer2": 8.847656607627869, "mean_norm/layer20": 10.778528094291687, "mean_norm/layer21": 10.735529243946075, "mean_norm/layer22": 11.689706325531006, "mean_norm/layer23": 11.635596692562103, "mean_norm/layer3": 11.107528388500214, "mean_norm/layer4": 9.976164162158966, "mean_norm/layer5": 12.269051373004913, "mean_norm/layer6": 9.51415604352951, "mean_norm/layer7": 10.01818311214447, "mean_norm/layer8": 10.486587703227997, "mean_norm/layer9": 10.418387532234192, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 9400 }, { "epoch": 3.92, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4681495722855648, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.6942684650421143, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6432, "eval_samples_per_second": 20.699, "eval_steps_per_second": 0.687, "step": 9400 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.95, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.573, "max_norm": 33.00111389160156, "max_norm/layer0": 25.53734016418457, "max_norm/layer1": 26.78814125061035, "max_norm/layer10": 28.42632293701172, "max_norm/layer11": 26.61481475830078, "max_norm/layer12": 29.382888793945312, "max_norm/layer13": 25.50127601623535, "max_norm/layer14": 27.171720504760742, "max_norm/layer15": 32.12615966796875, "max_norm/layer16": 26.910057067871094, "max_norm/layer17": 32.16920852661133, "max_norm/layer18": 28.307641983032227, "max_norm/layer19": 27.791166305541992, "max_norm/layer2": 21.225391387939453, "max_norm/layer20": 28.681900024414062, "max_norm/layer21": 28.29361915588379, "max_norm/layer22": 29.12259292602539, "max_norm/layer23": 27.881290435791016, "max_norm/layer3": 26.104650497436523, "max_norm/layer4": 25.875703811645508, "max_norm/layer5": 33.00111389160156, "max_norm/layer6": 22.065937042236328, "max_norm/layer7": 28.001384735107422, "max_norm/layer8": 27.930898666381836, "max_norm/layer9": 27.698144912719727, "mean_norm": 10.67796295384566, "mean_norm/layer0": 10.27203243970871, "mean_norm/layer1": 10.161053121089935, "mean_norm/layer10": 10.51726907491684, "mean_norm/layer11": 10.820999085903168, "mean_norm/layer12": 11.341056287288666, "mean_norm/layer13": 10.505224525928497, "mean_norm/layer14": 10.886779367923737, "mean_norm/layer15": 11.20365023612976, "mean_norm/layer16": 10.591172337532043, "mean_norm/layer17": 11.071096956729889, "mean_norm/layer18": 10.631023526191711, "mean_norm/layer19": 10.677245795726776, "mean_norm/layer2": 8.850984394550323, "mean_norm/layer20": 10.787645399570465, "mean_norm/layer21": 10.744815289974213, "mean_norm/layer22": 11.702471911907196, "mean_norm/layer23": 11.648136258125305, "mean_norm/layer3": 11.11998337507248, "mean_norm/layer4": 9.983684122562408, "mean_norm/layer5": 12.285788357257843, "mean_norm/layer6": 9.519932866096497, "mean_norm/layer7": 10.02573847770691, "mean_norm/layer8": 10.495937168598175, "mean_norm/layer9": 10.42739051580429, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 9450 }, { "epoch": 3.95, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4690256872026381, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.6952497959136963, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.846, "eval_samples_per_second": 20.344, "eval_steps_per_second": 0.675, "step": 9450 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.97, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5826, "max_norm": 33.11233139038086, "max_norm/layer0": 25.61636734008789, "max_norm/layer1": 26.879316329956055, "max_norm/layer10": 28.511680603027344, "max_norm/layer11": 26.70820426940918, "max_norm/layer12": 29.474576950073242, "max_norm/layer13": 25.595924377441406, "max_norm/layer14": 27.25803565979004, "max_norm/layer15": 32.24443817138672, "max_norm/layer16": 27.010766983032227, "max_norm/layer17": 32.268558502197266, "max_norm/layer18": 28.439178466796875, "max_norm/layer19": 27.8987979888916, "max_norm/layer2": 21.282726287841797, "max_norm/layer20": 28.772045135498047, "max_norm/layer21": 28.373287200927734, "max_norm/layer22": 29.23287010192871, "max_norm/layer23": 27.96897315979004, "max_norm/layer3": 26.182008743286133, "max_norm/layer4": 25.959827423095703, "max_norm/layer5": 33.11233139038086, "max_norm/layer6": 22.129119873046875, "max_norm/layer7": 28.099084854125977, "max_norm/layer8": 28.009950637817383, "max_norm/layer9": 27.775909423828125, "mean_norm": 10.688044652342796, "mean_norm/layer0": 10.283402860164642, "mean_norm/layer1": 10.17039829492569, "mean_norm/layer10": 10.52660220861435, "mean_norm/layer11": 10.831436216831207, "mean_norm/layer12": 11.354080498218536, "mean_norm/layer13": 10.514998495578766, "mean_norm/layer14": 10.89742910861969, "mean_norm/layer15": 11.215672731399536, "mean_norm/layer16": 10.600797593593597, "mean_norm/layer17": 11.081857025623322, "mean_norm/layer18": 10.640068292617798, "mean_norm/layer19": 10.686591744422913, "mean_norm/layer2": 8.854361951351166, "mean_norm/layer20": 10.796972274780273, "mean_norm/layer21": 10.754287958145142, "mean_norm/layer22": 11.71543425321579, "mean_norm/layer23": 11.660886287689209, "mean_norm/layer3": 11.13255774974823, "mean_norm/layer4": 9.991296291351318, "mean_norm/layer5": 12.302757441997528, "mean_norm/layer6": 9.525744915008545, "mean_norm/layer7": 10.033455848693848, "mean_norm/layer8": 10.505375623703003, "mean_norm/layer9": 10.436605989933014, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 9500 }, { "epoch": 3.97, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46980445601781434, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.6896309852600098, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6117, "eval_samples_per_second": 20.755, "eval_steps_per_second": 0.689, "step": 9500 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 3.99, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5845, "max_norm": 33.22111511230469, "max_norm/layer0": 25.70020866394043, "max_norm/layer1": 26.959239959716797, "max_norm/layer10": 28.604167938232422, "max_norm/layer11": 26.803647994995117, "max_norm/layer12": 29.598041534423828, "max_norm/layer13": 25.70684051513672, "max_norm/layer14": 27.33949851989746, "max_norm/layer15": 32.35847473144531, "max_norm/layer16": 27.094337463378906, "max_norm/layer17": 32.37206268310547, "max_norm/layer18": 28.551963806152344, "max_norm/layer19": 28.00347900390625, "max_norm/layer2": 21.350160598754883, "max_norm/layer20": 28.8660888671875, "max_norm/layer21": 28.463394165039062, "max_norm/layer22": 29.33779525756836, "max_norm/layer23": 28.057477951049805, "max_norm/layer3": 26.272552490234375, "max_norm/layer4": 26.05592155456543, "max_norm/layer5": 33.22111511230469, "max_norm/layer6": 22.20157814025879, "max_norm/layer7": 28.201513290405273, "max_norm/layer8": 28.098514556884766, "max_norm/layer9": 27.844715118408203, "mean_norm": 10.698029942810535, "mean_norm/layer0": 10.294709742069244, "mean_norm/layer1": 10.179706275463104, "mean_norm/layer10": 10.535793900489807, "mean_norm/layer11": 10.841690242290497, "mean_norm/layer12": 11.367003858089447, "mean_norm/layer13": 10.524603307247162, "mean_norm/layer14": 10.90799218416214, "mean_norm/layer15": 11.227812469005585, "mean_norm/layer16": 10.610308766365051, "mean_norm/layer17": 11.092499136924744, "mean_norm/layer18": 10.648983716964722, "mean_norm/layer19": 10.695793569087982, "mean_norm/layer2": 8.85766851902008, "mean_norm/layer20": 10.806212484836578, "mean_norm/layer21": 10.76362019777298, "mean_norm/layer22": 11.728101670742035, "mean_norm/layer23": 11.673562049865723, "mean_norm/layer3": 11.145098149776459, "mean_norm/layer4": 9.99885606765747, "mean_norm/layer5": 12.319611668586731, "mean_norm/layer6": 9.53151524066925, "mean_norm/layer7": 10.041094720363617, "mean_norm/layer8": 10.514805734157562, "mean_norm/layer9": 10.44567495584488, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 9550 }, { "epoch": 3.99, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4687012001963146, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.6940293312072754, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8271, "eval_samples_per_second": 20.377, "eval_steps_per_second": 0.676, "step": 9550 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.01, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5008, "max_norm": 33.330360412597656, "max_norm/layer0": 25.78761100769043, "max_norm/layer1": 27.03449821472168, "max_norm/layer10": 28.674245834350586, "max_norm/layer11": 26.880537033081055, "max_norm/layer12": 29.694679260253906, "max_norm/layer13": 25.82834243774414, "max_norm/layer14": 27.425241470336914, "max_norm/layer15": 32.486995697021484, "max_norm/layer16": 27.171628952026367, "max_norm/layer17": 32.492279052734375, "max_norm/layer18": 28.64808464050293, "max_norm/layer19": 28.095623016357422, "max_norm/layer2": 21.42145347595215, "max_norm/layer20": 28.951364517211914, "max_norm/layer21": 28.559009552001953, "max_norm/layer22": 29.44493865966797, "max_norm/layer23": 28.142528533935547, "max_norm/layer3": 26.364864349365234, "max_norm/layer4": 26.138946533203125, "max_norm/layer5": 33.330360412597656, "max_norm/layer6": 22.253427505493164, "max_norm/layer7": 28.289306640625, "max_norm/layer8": 28.16522789001465, "max_norm/layer9": 27.91402244567871, "mean_norm": 10.707975409924984, "mean_norm/layer0": 10.30594515800476, "mean_norm/layer1": 10.188912451267242, "mean_norm/layer10": 10.544912993907928, "mean_norm/layer11": 10.851902425289154, "mean_norm/layer12": 11.379847884178162, "mean_norm/layer13": 10.534163355827332, "mean_norm/layer14": 10.918485581874847, "mean_norm/layer15": 11.239793062210083, "mean_norm/layer16": 10.619805216789246, "mean_norm/layer17": 11.103209257125854, "mean_norm/layer18": 10.657873153686523, "mean_norm/layer19": 10.705002188682556, "mean_norm/layer2": 8.860992550849915, "mean_norm/layer20": 10.81546437740326, "mean_norm/layer21": 10.773070752620697, "mean_norm/layer22": 11.740694344043732, "mean_norm/layer23": 11.686245620250702, "mean_norm/layer3": 11.157555222511292, "mean_norm/layer4": 10.006467998027802, "mean_norm/layer5": 12.33630108833313, "mean_norm/layer6": 9.53725254535675, "mean_norm/layer7": 10.04867398738861, "mean_norm/layer8": 10.52416044473648, "mean_norm/layer9": 10.454678177833557, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 9600 }, { "epoch": 4.01, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46611747240846424, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.72489857673645, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5754, "eval_samples_per_second": 20.82, "eval_steps_per_second": 0.691, "step": 9600 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.03, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.3794, "max_norm": 33.43217468261719, "max_norm/layer0": 25.877573013305664, "max_norm/layer1": 27.117990493774414, "max_norm/layer10": 28.741506576538086, "max_norm/layer11": 26.964374542236328, "max_norm/layer12": 29.798730850219727, "max_norm/layer13": 25.944913864135742, "max_norm/layer14": 27.508432388305664, "max_norm/layer15": 32.604679107666016, "max_norm/layer16": 27.249217987060547, "max_norm/layer17": 32.60658645629883, "max_norm/layer18": 28.736671447753906, "max_norm/layer19": 28.200363159179688, "max_norm/layer2": 21.477174758911133, "max_norm/layer20": 29.063146591186523, "max_norm/layer21": 28.660245895385742, "max_norm/layer22": 29.5419979095459, "max_norm/layer23": 28.22159767150879, "max_norm/layer3": 26.45147705078125, "max_norm/layer4": 26.22504425048828, "max_norm/layer5": 33.43217468261719, "max_norm/layer6": 22.306541442871094, "max_norm/layer7": 28.394588470458984, "max_norm/layer8": 28.237964630126953, "max_norm/layer9": 28.015945434570312, "mean_norm": 10.718371979892254, "mean_norm/layer0": 10.31786572933197, "mean_norm/layer1": 10.19822359085083, "mean_norm/layer10": 10.554284036159515, "mean_norm/layer11": 10.862599432468414, "mean_norm/layer12": 11.393266081809998, "mean_norm/layer13": 10.544181823730469, "mean_norm/layer14": 10.929447948932648, "mean_norm/layer15": 11.252337992191315, "mean_norm/layer16": 10.629814624786377, "mean_norm/layer17": 11.114417672157288, "mean_norm/layer18": 10.667439937591553, "mean_norm/layer19": 10.715016543865204, "mean_norm/layer2": 8.864496111869812, "mean_norm/layer20": 10.825547099113464, "mean_norm/layer21": 10.783361256122589, "mean_norm/layer22": 11.753725469112396, "mean_norm/layer23": 11.699581742286682, "mean_norm/layer3": 11.170176565647125, "mean_norm/layer4": 10.014464855194092, "mean_norm/layer5": 12.353192925453186, "mean_norm/layer6": 9.543238639831543, "mean_norm/layer7": 10.056542873382568, "mean_norm/layer8": 10.533743023872375, "mean_norm/layer9": 10.46396154165268, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 9650 }, { "epoch": 4.03, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4661945380724661, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7255403995513916, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8304, "eval_samples_per_second": 20.371, "eval_steps_per_second": 0.676, "step": 9650 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.05, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4052, "max_norm": 33.544166564941406, "max_norm/layer0": 25.971208572387695, "max_norm/layer1": 27.212482452392578, "max_norm/layer10": 28.805835723876953, "max_norm/layer11": 27.037063598632812, "max_norm/layer12": 29.901081085205078, "max_norm/layer13": 26.061325073242188, "max_norm/layer14": 27.592479705810547, "max_norm/layer15": 32.70225143432617, "max_norm/layer16": 27.345638275146484, "max_norm/layer17": 32.72298812866211, "max_norm/layer18": 28.8302059173584, "max_norm/layer19": 28.301692962646484, "max_norm/layer2": 21.534664154052734, "max_norm/layer20": 29.158594131469727, "max_norm/layer21": 28.769094467163086, "max_norm/layer22": 29.628246307373047, "max_norm/layer23": 28.29683494567871, "max_norm/layer3": 26.550901412963867, "max_norm/layer4": 26.31060791015625, "max_norm/layer5": 33.544166564941406, "max_norm/layer6": 22.365896224975586, "max_norm/layer7": 28.48600959777832, "max_norm/layer8": 28.317893981933594, "max_norm/layer9": 28.098060607910156, "mean_norm": 10.72877743591865, "mean_norm/layer0": 10.33024138212204, "mean_norm/layer1": 10.20755660533905, "mean_norm/layer10": 10.56365418434143, "mean_norm/layer11": 10.873272597789764, "mean_norm/layer12": 11.406682074069977, "mean_norm/layer13": 10.554228723049164, "mean_norm/layer14": 10.94050520658493, "mean_norm/layer15": 11.2648805975914, "mean_norm/layer16": 10.639814674854279, "mean_norm/layer17": 11.125602781772614, "mean_norm/layer18": 10.67691570520401, "mean_norm/layer19": 10.724987506866455, "mean_norm/layer2": 8.8680060505867, "mean_norm/layer20": 10.835620880126953, "mean_norm/layer21": 10.793499529361725, "mean_norm/layer22": 11.766671538352966, "mean_norm/layer23": 11.71286165714264, "mean_norm/layer3": 11.1830073595047, "mean_norm/layer4": 10.02237868309021, "mean_norm/layer5": 12.3701092004776, "mean_norm/layer6": 9.549232542514801, "mean_norm/layer7": 10.064398467540741, "mean_norm/layer8": 10.54334545135498, "mean_norm/layer9": 10.473185062408447, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 9700 }, { "epoch": 4.05, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46593089237982827, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7316884994506836, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8212, "eval_samples_per_second": 20.387, "eval_steps_per_second": 0.677, "step": 9700 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.07, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4048, "max_norm": 33.6557731628418, "max_norm/layer0": 26.066650390625, "max_norm/layer1": 27.306856155395508, "max_norm/layer10": 28.87506675720215, "max_norm/layer11": 27.117992401123047, "max_norm/layer12": 30.010032653808594, "max_norm/layer13": 26.163286209106445, "max_norm/layer14": 27.68418312072754, "max_norm/layer15": 32.824462890625, "max_norm/layer16": 27.442707061767578, "max_norm/layer17": 32.84294128417969, "max_norm/layer18": 28.918869018554688, "max_norm/layer19": 28.40460205078125, "max_norm/layer2": 21.58877182006836, "max_norm/layer20": 29.261137008666992, "max_norm/layer21": 28.882108688354492, "max_norm/layer22": 29.714868545532227, "max_norm/layer23": 28.384431838989258, "max_norm/layer3": 26.648792266845703, "max_norm/layer4": 26.3952693939209, "max_norm/layer5": 33.6557731628418, "max_norm/layer6": 22.42438316345215, "max_norm/layer7": 28.574481964111328, "max_norm/layer8": 28.396562576293945, "max_norm/layer9": 28.194005966186523, "mean_norm": 10.739245263238749, "mean_norm/layer0": 10.34294319152832, "mean_norm/layer1": 10.216990768909454, "mean_norm/layer10": 10.573124587535858, "mean_norm/layer11": 10.884048283100128, "mean_norm/layer12": 11.420178711414337, "mean_norm/layer13": 10.56421959400177, "mean_norm/layer14": 10.95153260231018, "mean_norm/layer15": 11.277423799037933, "mean_norm/layer16": 10.649728536605835, "mean_norm/layer17": 11.136787831783295, "mean_norm/layer18": 10.686513543128967, "mean_norm/layer19": 10.735000014305115, "mean_norm/layer2": 8.871544182300568, "mean_norm/layer20": 10.845619082450867, "mean_norm/layer21": 10.803569555282593, "mean_norm/layer22": 11.779800772666931, "mean_norm/layer23": 11.72627604007721, "mean_norm/layer3": 11.19598013162613, "mean_norm/layer4": 10.030231535434723, "mean_norm/layer5": 12.387197315692902, "mean_norm/layer6": 9.555224657058716, "mean_norm/layer7": 10.072312891483307, "mean_norm/layer8": 10.552999079227448, "mean_norm/layer9": 10.482639610767365, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 9750 }, { "epoch": 4.07, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4651399553019149, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.731163501739502, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6326, "eval_samples_per_second": 20.718, "eval_steps_per_second": 0.688, "step": 9750 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.09, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.431, "max_norm": 33.754417419433594, "max_norm/layer0": 26.159645080566406, "max_norm/layer1": 27.404632568359375, "max_norm/layer10": 28.946714401245117, "max_norm/layer11": 27.202007293701172, "max_norm/layer12": 30.121065139770508, "max_norm/layer13": 26.25760841369629, "max_norm/layer14": 27.78693389892578, "max_norm/layer15": 32.94147872924805, "max_norm/layer16": 27.53252601623535, "max_norm/layer17": 32.94584274291992, "max_norm/layer18": 29.010591506958008, "max_norm/layer19": 28.501497268676758, "max_norm/layer2": 21.647987365722656, "max_norm/layer20": 29.359277725219727, "max_norm/layer21": 28.98589515686035, "max_norm/layer22": 29.815181732177734, "max_norm/layer23": 28.46575927734375, "max_norm/layer3": 26.744037628173828, "max_norm/layer4": 26.49158477783203, "max_norm/layer5": 33.754417419433594, "max_norm/layer6": 22.48211097717285, "max_norm/layer7": 28.680606842041016, "max_norm/layer8": 28.470558166503906, "max_norm/layer9": 28.30710220336914, "mean_norm": 10.749750765661398, "mean_norm/layer0": 10.355877697467804, "mean_norm/layer1": 10.226464807987213, "mean_norm/layer10": 10.582582950592041, "mean_norm/layer11": 10.894802331924438, "mean_norm/layer12": 11.433715283870697, "mean_norm/layer13": 10.574375629425049, "mean_norm/layer14": 10.96265333890915, "mean_norm/layer15": 11.29006689786911, "mean_norm/layer16": 10.659694969654083, "mean_norm/layer17": 11.147985517978668, "mean_norm/layer18": 10.696076333522797, "mean_norm/layer19": 10.744998633861542, "mean_norm/layer2": 8.87516975402832, "mean_norm/layer20": 10.855427503585815, "mean_norm/layer21": 10.813684225082397, "mean_norm/layer22": 11.792862176895142, "mean_norm/layer23": 11.739510834217072, "mean_norm/layer3": 11.209203958511353, "mean_norm/layer4": 10.038220882415771, "mean_norm/layer5": 12.404386818408966, "mean_norm/layer6": 9.561310589313507, "mean_norm/layer7": 10.080223083496094, "mean_norm/layer8": 10.56266450881958, "mean_norm/layer9": 10.492059648036957, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 9800 }, { "epoch": 4.09, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4648844217844352, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.733736276626587, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8593, "eval_samples_per_second": 20.322, "eval_steps_per_second": 0.675, "step": 9800 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.11, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4228, "max_norm": 33.861244201660156, "max_norm/layer0": 26.24639320373535, "max_norm/layer1": 27.48942756652832, "max_norm/layer10": 29.03034019470215, "max_norm/layer11": 27.291231155395508, "max_norm/layer12": 30.230600357055664, "max_norm/layer13": 26.365447998046875, "max_norm/layer14": 27.9014835357666, "max_norm/layer15": 33.083675384521484, "max_norm/layer16": 27.63498878479004, "max_norm/layer17": 33.05691909790039, "max_norm/layer18": 29.120906829833984, "max_norm/layer19": 28.622779846191406, "max_norm/layer2": 21.700437545776367, "max_norm/layer20": 29.4544734954834, "max_norm/layer21": 29.081451416015625, "max_norm/layer22": 29.90110206604004, "max_norm/layer23": 28.563703536987305, "max_norm/layer3": 26.82892417907715, "max_norm/layer4": 26.564434051513672, "max_norm/layer5": 33.861244201660156, "max_norm/layer6": 22.549427032470703, "max_norm/layer7": 28.77765655517578, "max_norm/layer8": 28.5548152923584, "max_norm/layer9": 28.40509605407715, "mean_norm": 10.760287982722124, "mean_norm/layer0": 10.368937730789185, "mean_norm/layer1": 10.236066102981567, "mean_norm/layer10": 10.592142224311829, "mean_norm/layer11": 10.905653715133667, "mean_norm/layer12": 11.44727337360382, "mean_norm/layer13": 10.584530711174011, "mean_norm/layer14": 10.973800659179688, "mean_norm/layer15": 11.30276346206665, "mean_norm/layer16": 10.669570624828339, "mean_norm/layer17": 11.159093022346497, "mean_norm/layer18": 10.705552816390991, "mean_norm/layer19": 10.755048036575317, "mean_norm/layer2": 8.878891050815582, "mean_norm/layer20": 10.865257143974304, "mean_norm/layer21": 10.82360953092575, "mean_norm/layer22": 11.805942714214325, "mean_norm/layer23": 11.752815186977386, "mean_norm/layer3": 11.2224680185318, "mean_norm/layer4": 10.046254456043243, "mean_norm/layer5": 12.421765625476837, "mean_norm/layer6": 9.567421734333038, "mean_norm/layer7": 10.08821588754654, "mean_norm/layer8": 10.572381436824799, "mean_norm/layer9": 10.501456320285797, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 9850 }, { "epoch": 4.11, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46495743136085793, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.736454963684082, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6254, "eval_samples_per_second": 20.731, "eval_steps_per_second": 0.688, "step": 9850 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.13, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4248, "max_norm": 33.9556770324707, "max_norm/layer0": 26.33261489868164, "max_norm/layer1": 27.56793785095215, "max_norm/layer10": 29.119720458984375, "max_norm/layer11": 27.357046127319336, "max_norm/layer12": 30.328794479370117, "max_norm/layer13": 26.464094161987305, "max_norm/layer14": 28.015090942382812, "max_norm/layer15": 33.20350646972656, "max_norm/layer16": 27.721712112426758, "max_norm/layer17": 33.16472244262695, "max_norm/layer18": 29.199329376220703, "max_norm/layer19": 28.717470169067383, "max_norm/layer2": 21.774988174438477, "max_norm/layer20": 29.529516220092773, "max_norm/layer21": 29.168851852416992, "max_norm/layer22": 29.998376846313477, "max_norm/layer23": 28.664161682128906, "max_norm/layer3": 26.9122371673584, "max_norm/layer4": 26.651660919189453, "max_norm/layer5": 33.9556770324707, "max_norm/layer6": 22.61054801940918, "max_norm/layer7": 28.86550521850586, "max_norm/layer8": 28.6397705078125, "max_norm/layer9": 28.507871627807617, "mean_norm": 10.770872302353382, "mean_norm/layer0": 10.382256388664246, "mean_norm/layer1": 10.245670199394226, "mean_norm/layer10": 10.601735293865204, "mean_norm/layer11": 10.916560173034668, "mean_norm/layer12": 11.46084600687027, "mean_norm/layer13": 10.594715774059296, "mean_norm/layer14": 10.984999299049377, "mean_norm/layer15": 11.315381169319153, "mean_norm/layer16": 10.679502785205841, "mean_norm/layer17": 11.17024689912796, "mean_norm/layer18": 10.714980006217957, "mean_norm/layer19": 10.764934778213501, "mean_norm/layer2": 8.882648348808289, "mean_norm/layer20": 10.875350773334503, "mean_norm/layer21": 10.833550810813904, "mean_norm/layer22": 11.81899881362915, "mean_norm/layer23": 11.766067922115326, "mean_norm/layer3": 11.235760807991028, "mean_norm/layer4": 10.05432653427124, "mean_norm/layer5": 12.439239859580994, "mean_norm/layer6": 9.573659777641296, "mean_norm/layer7": 10.096255362033844, "mean_norm/layer8": 10.582192361354828, "mean_norm/layer9": 10.51105511188507, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 9900 }, { "epoch": 4.13, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4645396543402165, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7372591495513916, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6883, "eval_samples_per_second": 20.619, "eval_steps_per_second": 0.684, "step": 9900 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.15, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4436, "max_norm": 34.049339294433594, "max_norm/layer0": 26.419641494750977, "max_norm/layer1": 27.664649963378906, "max_norm/layer10": 29.210588455200195, "max_norm/layer11": 27.431074142456055, "max_norm/layer12": 30.43071937561035, "max_norm/layer13": 26.566423416137695, "max_norm/layer14": 28.112030029296875, "max_norm/layer15": 33.33354187011719, "max_norm/layer16": 27.804418563842773, "max_norm/layer17": 33.27605438232422, "max_norm/layer18": 29.307640075683594, "max_norm/layer19": 28.8117733001709, "max_norm/layer2": 21.834720611572266, "max_norm/layer20": 29.619890213012695, "max_norm/layer21": 29.266197204589844, "max_norm/layer22": 30.08498764038086, "max_norm/layer23": 28.764848709106445, "max_norm/layer3": 26.997285842895508, "max_norm/layer4": 26.735742568969727, "max_norm/layer5": 34.049339294433594, "max_norm/layer6": 22.67427635192871, "max_norm/layer7": 28.954214096069336, "max_norm/layer8": 28.72142791748047, "max_norm/layer9": 28.615943908691406, "mean_norm": 10.781430753568808, "mean_norm/layer0": 10.395660698413849, "mean_norm/layer1": 10.255378246307373, "mean_norm/layer10": 10.61120194196701, "mean_norm/layer11": 10.9274360537529, "mean_norm/layer12": 11.474487781524658, "mean_norm/layer13": 10.604840219020844, "mean_norm/layer14": 10.996111154556274, "mean_norm/layer15": 11.328039467334747, "mean_norm/layer16": 10.689521372318268, "mean_norm/layer17": 11.181367576122284, "mean_norm/layer18": 10.724294066429138, "mean_norm/layer19": 10.774694919586182, "mean_norm/layer2": 8.886360824108124, "mean_norm/layer20": 10.885128438472748, "mean_norm/layer21": 10.843543469905853, "mean_norm/layer22": 11.83205932378769, "mean_norm/layer23": 11.779264986515045, "mean_norm/layer3": 11.249089777469635, "mean_norm/layer4": 10.062511086463928, "mean_norm/layer5": 12.456778228282928, "mean_norm/layer6": 9.579894959926605, "mean_norm/layer7": 10.104304015636444, "mean_norm/layer8": 10.59186977148056, "mean_norm/layer9": 10.52049970626831, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 9950 }, { "epoch": 4.15, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4647992439452753, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7321929931640625, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5663, "eval_samples_per_second": 20.836, "eval_steps_per_second": 0.692, "step": 9950 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.18, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4491, "max_norm": 34.14283752441406, "max_norm/layer0": 26.50551986694336, "max_norm/layer1": 27.7550106048584, "max_norm/layer10": 29.307462692260742, "max_norm/layer11": 27.49453353881836, "max_norm/layer12": 30.52471160888672, "max_norm/layer13": 26.660375595092773, "max_norm/layer14": 28.200090408325195, "max_norm/layer15": 33.45909881591797, "max_norm/layer16": 27.896703720092773, "max_norm/layer17": 33.38733673095703, "max_norm/layer18": 29.413230895996094, "max_norm/layer19": 28.905559539794922, "max_norm/layer2": 21.893877029418945, "max_norm/layer20": 29.715972900390625, "max_norm/layer21": 29.35295867919922, "max_norm/layer22": 30.175220489501953, "max_norm/layer23": 28.85986328125, "max_norm/layer3": 27.073829650878906, "max_norm/layer4": 26.81964683532715, "max_norm/layer5": 34.14283752441406, "max_norm/layer6": 22.7307071685791, "max_norm/layer7": 29.045549392700195, "max_norm/layer8": 28.79771614074707, "max_norm/layer9": 28.713727951049805, "mean_norm": 10.791931385795275, "mean_norm/layer0": 10.409155309200287, "mean_norm/layer1": 10.2649627327919, "mean_norm/layer10": 10.620647609233856, "mean_norm/layer11": 10.938298046588898, "mean_norm/layer12": 11.488030791282654, "mean_norm/layer13": 10.61491984128952, "mean_norm/layer14": 11.007142424583435, "mean_norm/layer15": 11.340634763240814, "mean_norm/layer16": 10.699385046958923, "mean_norm/layer17": 11.192373037338257, "mean_norm/layer18": 10.733623325824738, "mean_norm/layer19": 10.784404814243317, "mean_norm/layer2": 8.890056729316711, "mean_norm/layer20": 10.89472770690918, "mean_norm/layer21": 10.853393316268921, "mean_norm/layer22": 11.845016062259674, "mean_norm/layer23": 11.792450189590454, "mean_norm/layer3": 11.262365102767944, "mean_norm/layer4": 10.070643126964569, "mean_norm/layer5": 12.47421932220459, "mean_norm/layer6": 9.5861154794693, "mean_norm/layer7": 10.112246751785278, "mean_norm/layer8": 10.601553738117218, "mean_norm/layer9": 10.52998799085617, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 10000 }, { "epoch": 4.18, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46464105652969256, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7348339557647705, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8228, "eval_samples_per_second": 20.384, "eval_steps_per_second": 0.677, "step": 10000 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.2, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4329, "max_norm": 34.24258041381836, "max_norm/layer0": 26.59330177307129, "max_norm/layer1": 27.850889205932617, "max_norm/layer10": 29.392183303833008, "max_norm/layer11": 27.56389808654785, "max_norm/layer12": 30.620975494384766, "max_norm/layer13": 26.739151000976562, "max_norm/layer14": 28.295047760009766, "max_norm/layer15": 33.56934356689453, "max_norm/layer16": 27.998239517211914, "max_norm/layer17": 33.505916595458984, "max_norm/layer18": 29.517406463623047, "max_norm/layer19": 29.00499725341797, "max_norm/layer2": 21.960556030273438, "max_norm/layer20": 29.809242248535156, "max_norm/layer21": 29.433250427246094, "max_norm/layer22": 30.258737564086914, "max_norm/layer23": 28.964088439941406, "max_norm/layer3": 27.16298484802246, "max_norm/layer4": 26.908559799194336, "max_norm/layer5": 34.24258041381836, "max_norm/layer6": 22.788379669189453, "max_norm/layer7": 29.131332397460938, "max_norm/layer8": 28.89280128479004, "max_norm/layer9": 28.82826042175293, "mean_norm": 10.802442769209543, "mean_norm/layer0": 10.422712087631226, "mean_norm/layer1": 10.274647951126099, "mean_norm/layer10": 10.630156993865967, "mean_norm/layer11": 10.949021577835083, "mean_norm/layer12": 11.501543462276459, "mean_norm/layer13": 10.62501984834671, "mean_norm/layer14": 11.018203675746918, "mean_norm/layer15": 11.353238582611084, "mean_norm/layer16": 10.70931327342987, "mean_norm/layer17": 11.203383982181549, "mean_norm/layer18": 10.742836117744446, "mean_norm/layer19": 10.79411780834198, "mean_norm/layer2": 8.89378023147583, "mean_norm/layer20": 10.904330492019653, "mean_norm/layer21": 10.863244533538818, "mean_norm/layer22": 11.858083486557007, "mean_norm/layer23": 11.805590689182281, "mean_norm/layer3": 11.275679171085358, "mean_norm/layer4": 10.078687965869904, "mean_norm/layer5": 12.491709351539612, "mean_norm/layer6": 9.592344641685486, "mean_norm/layer7": 10.120253562927246, "mean_norm/layer8": 10.611266136169434, "mean_norm/layer9": 10.539460837841034, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 10050 }, { "epoch": 4.2, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4653305914181299, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7377023696899414, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8222, "eval_samples_per_second": 20.385, "eval_steps_per_second": 0.677, "step": 10050 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.22, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4418, "max_norm": 34.33783721923828, "max_norm/layer0": 26.687532424926758, "max_norm/layer1": 27.943302154541016, "max_norm/layer10": 29.47475814819336, "max_norm/layer11": 27.646385192871094, "max_norm/layer12": 30.71775245666504, "max_norm/layer13": 26.815946578979492, "max_norm/layer14": 28.3834228515625, "max_norm/layer15": 33.6978874206543, "max_norm/layer16": 28.076602935791016, "max_norm/layer17": 33.623817443847656, "max_norm/layer18": 29.62516975402832, "max_norm/layer19": 29.10083770751953, "max_norm/layer2": 22.04039192199707, "max_norm/layer20": 29.9028377532959, "max_norm/layer21": 29.55206871032715, "max_norm/layer22": 30.35678482055664, "max_norm/layer23": 29.040468215942383, "max_norm/layer3": 27.252946853637695, "max_norm/layer4": 26.981002807617188, "max_norm/layer5": 34.33783721923828, "max_norm/layer6": 22.85585594177246, "max_norm/layer7": 29.2227840423584, "max_norm/layer8": 28.991825103759766, "max_norm/layer9": 28.919313430786133, "mean_norm": 10.813075611988703, "mean_norm/layer0": 10.436362564563751, "mean_norm/layer1": 10.284512996673584, "mean_norm/layer10": 10.639845430850983, "mean_norm/layer11": 10.960028350353241, "mean_norm/layer12": 11.515252709388733, "mean_norm/layer13": 10.635209619998932, "mean_norm/layer14": 11.029352128505707, "mean_norm/layer15": 11.365962743759155, "mean_norm/layer16": 10.71934300661087, "mean_norm/layer17": 11.21452122926712, "mean_norm/layer18": 10.75224620103836, "mean_norm/layer19": 10.80382651090622, "mean_norm/layer2": 8.897547483444214, "mean_norm/layer20": 10.914192497730255, "mean_norm/layer21": 10.873103141784668, "mean_norm/layer22": 11.871187806129456, "mean_norm/layer23": 11.81886202096939, "mean_norm/layer3": 11.289128601551056, "mean_norm/layer4": 10.086705446243286, "mean_norm/layer5": 12.509444057941437, "mean_norm/layer6": 9.598621368408203, "mean_norm/layer7": 10.128449976444244, "mean_norm/layer8": 10.621142864227295, "mean_norm/layer9": 10.54896593093872, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 10100 }, { "epoch": 4.22, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46528597445476044, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7357242107391357, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6332, "eval_samples_per_second": 20.716, "eval_steps_per_second": 0.688, "step": 10100 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.24, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4544, "max_norm": 34.453956604003906, "max_norm/layer0": 26.772411346435547, "max_norm/layer1": 28.041337966918945, "max_norm/layer10": 29.558502197265625, "max_norm/layer11": 27.715511322021484, "max_norm/layer12": 30.828214645385742, "max_norm/layer13": 26.886316299438477, "max_norm/layer14": 28.47247886657715, "max_norm/layer15": 33.815494537353516, "max_norm/layer16": 28.156137466430664, "max_norm/layer17": 33.7318115234375, "max_norm/layer18": 29.730388641357422, "max_norm/layer19": 29.191200256347656, "max_norm/layer2": 22.100492477416992, "max_norm/layer20": 29.983238220214844, "max_norm/layer21": 29.642305374145508, "max_norm/layer22": 30.443191528320312, "max_norm/layer23": 29.122554779052734, "max_norm/layer3": 27.341691970825195, "max_norm/layer4": 27.058629989624023, "max_norm/layer5": 34.453956604003906, "max_norm/layer6": 22.911787033081055, "max_norm/layer7": 29.31786346435547, "max_norm/layer8": 29.09516143798828, "max_norm/layer9": 29.001785278320312, "mean_norm": 10.823577101031939, "mean_norm/layer0": 10.449947893619537, "mean_norm/layer1": 10.294241428375244, "mean_norm/layer10": 10.649329900741577, "mean_norm/layer11": 10.97073119878769, "mean_norm/layer12": 11.528786540031433, "mean_norm/layer13": 10.64515471458435, "mean_norm/layer14": 11.040421605110168, "mean_norm/layer15": 11.378489017486572, "mean_norm/layer16": 10.729291319847107, "mean_norm/layer17": 11.22548794746399, "mean_norm/layer18": 10.761508107185364, "mean_norm/layer19": 10.813477575778961, "mean_norm/layer2": 8.90120553970337, "mean_norm/layer20": 10.923896491527557, "mean_norm/layer21": 10.882788181304932, "mean_norm/layer22": 11.884176313877106, "mean_norm/layer23": 11.831968367099762, "mean_norm/layer3": 11.302320063114166, "mean_norm/layer4": 10.094793438911438, "mean_norm/layer5": 12.52708524465561, "mean_norm/layer6": 9.604782938957214, "mean_norm/layer7": 10.136550486087799, "mean_norm/layer8": 10.630961179733276, "mean_norm/layer9": 10.558454930782318, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 10150 }, { "epoch": 4.24, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46512778703917773, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7335257530212402, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8291, "eval_samples_per_second": 20.374, "eval_steps_per_second": 0.676, "step": 10150 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.26, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4673, "max_norm": 34.58348083496094, "max_norm/layer0": 26.855865478515625, "max_norm/layer1": 28.143543243408203, "max_norm/layer10": 29.672481536865234, "max_norm/layer11": 27.77507781982422, "max_norm/layer12": 30.940479278564453, "max_norm/layer13": 26.968402862548828, "max_norm/layer14": 28.5567684173584, "max_norm/layer15": 33.94534683227539, "max_norm/layer16": 28.248029708862305, "max_norm/layer17": 33.84120559692383, "max_norm/layer18": 29.839115142822266, "max_norm/layer19": 29.27945899963379, "max_norm/layer2": 22.152008056640625, "max_norm/layer20": 30.0822811126709, "max_norm/layer21": 29.724666595458984, "max_norm/layer22": 30.52536392211914, "max_norm/layer23": 29.206314086914062, "max_norm/layer3": 27.427833557128906, "max_norm/layer4": 27.152973175048828, "max_norm/layer5": 34.58348083496094, "max_norm/layer6": 22.977237701416016, "max_norm/layer7": 29.407623291015625, "max_norm/layer8": 29.18715476989746, "max_norm/layer9": 29.0870418548584, "mean_norm": 10.833997232218584, "mean_norm/layer0": 10.463428616523743, "mean_norm/layer1": 10.30388629436493, "mean_norm/layer10": 10.658759415149689, "mean_norm/layer11": 10.981380045413971, "mean_norm/layer12": 11.542144119739532, "mean_norm/layer13": 10.655113756656647, "mean_norm/layer14": 11.05135828256607, "mean_norm/layer15": 11.390934586524963, "mean_norm/layer16": 10.739136815071106, "mean_norm/layer17": 11.236359000205994, "mean_norm/layer18": 10.770753979682922, "mean_norm/layer19": 10.822953343391418, "mean_norm/layer2": 8.904917061328888, "mean_norm/layer20": 10.933463454246521, "mean_norm/layer21": 10.89233547449112, "mean_norm/layer22": 11.897063732147217, "mean_norm/layer23": 11.84492552280426, "mean_norm/layer3": 11.315583348274231, "mean_norm/layer4": 10.102841198444366, "mean_norm/layer5": 12.544600367546082, "mean_norm/layer6": 9.610954105854034, "mean_norm/layer7": 10.144558072090149, "mean_norm/layer8": 10.64060389995575, "mean_norm/layer9": 10.5678790807724, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 10200 }, { "epoch": 4.26, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4655739566728725, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7333078384399414, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8316, "eval_samples_per_second": 20.369, "eval_steps_per_second": 0.676, "step": 10200 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.28, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4621, "max_norm": 34.71388626098633, "max_norm/layer0": 26.937944412231445, "max_norm/layer1": 28.25180435180664, "max_norm/layer10": 29.777528762817383, "max_norm/layer11": 27.845121383666992, "max_norm/layer12": 31.053159713745117, "max_norm/layer13": 27.057754516601562, "max_norm/layer14": 28.657506942749023, "max_norm/layer15": 34.0597038269043, "max_norm/layer16": 28.338624954223633, "max_norm/layer17": 33.95635986328125, "max_norm/layer18": 29.946928024291992, "max_norm/layer19": 29.373924255371094, "max_norm/layer2": 22.206056594848633, "max_norm/layer20": 30.173419952392578, "max_norm/layer21": 29.83626937866211, "max_norm/layer22": 30.619873046875, "max_norm/layer23": 29.289323806762695, "max_norm/layer3": 27.5142822265625, "max_norm/layer4": 27.233551025390625, "max_norm/layer5": 34.71388626098633, "max_norm/layer6": 23.036663055419922, "max_norm/layer7": 29.503074645996094, "max_norm/layer8": 29.276399612426758, "max_norm/layer9": 29.16158676147461, "mean_norm": 10.844474345445633, "mean_norm/layer0": 10.477041006088257, "mean_norm/layer1": 10.313621699810028, "mean_norm/layer10": 10.668282330036163, "mean_norm/layer11": 10.992021024227142, "mean_norm/layer12": 11.555621325969696, "mean_norm/layer13": 10.665147244930267, "mean_norm/layer14": 11.062337279319763, "mean_norm/layer15": 11.403449833393097, "mean_norm/layer16": 10.74899560213089, "mean_norm/layer17": 11.247314095497131, "mean_norm/layer18": 10.77999460697174, "mean_norm/layer19": 10.832535803318024, "mean_norm/layer2": 8.908604800701141, "mean_norm/layer20": 10.942877173423767, "mean_norm/layer21": 10.901946604251862, "mean_norm/layer22": 11.90995740890503, "mean_norm/layer23": 11.857899725437164, "mean_norm/layer3": 11.328973352909088, "mean_norm/layer4": 10.11098599433899, "mean_norm/layer5": 12.562341749668121, "mean_norm/layer6": 9.61716765165329, "mean_norm/layer7": 10.1526557803154, "mean_norm/layer8": 10.65031635761261, "mean_norm/layer9": 10.57729583978653, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 10250 }, { "epoch": 4.28, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.466563642042159, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7261102199554443, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6164, "eval_samples_per_second": 20.747, "eval_steps_per_second": 0.689, "step": 10250 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.3, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4588, "max_norm": 34.85292434692383, "max_norm/layer0": 27.01976203918457, "max_norm/layer1": 28.348358154296875, "max_norm/layer10": 29.854251861572266, "max_norm/layer11": 27.921520233154297, "max_norm/layer12": 31.167068481445312, "max_norm/layer13": 27.163440704345703, "max_norm/layer14": 28.76555061340332, "max_norm/layer15": 34.19651412963867, "max_norm/layer16": 28.430654525756836, "max_norm/layer17": 34.0618782043457, "max_norm/layer18": 30.038536071777344, "max_norm/layer19": 29.47166633605957, "max_norm/layer2": 22.28195571899414, "max_norm/layer20": 30.264249801635742, "max_norm/layer21": 29.946247100830078, "max_norm/layer22": 30.70496368408203, "max_norm/layer23": 29.37714195251465, "max_norm/layer3": 27.59646224975586, "max_norm/layer4": 27.327890396118164, "max_norm/layer5": 34.85292434692383, "max_norm/layer6": 23.106088638305664, "max_norm/layer7": 29.593017578125, "max_norm/layer8": 29.365062713623047, "max_norm/layer9": 29.251405715942383, "mean_norm": 10.855059415102005, "mean_norm/layer0": 10.490851998329163, "mean_norm/layer1": 10.323559045791626, "mean_norm/layer10": 10.677920937538147, "mean_norm/layer11": 11.002786934375763, "mean_norm/layer12": 11.569205522537231, "mean_norm/layer13": 10.675206542015076, "mean_norm/layer14": 11.073414862155914, "mean_norm/layer15": 11.416033565998077, "mean_norm/layer16": 10.759003520011902, "mean_norm/layer17": 11.258389592170715, "mean_norm/layer18": 10.789301872253418, "mean_norm/layer19": 10.842225074768066, "mean_norm/layer2": 8.912357330322266, "mean_norm/layer20": 10.952302515506744, "mean_norm/layer21": 10.911858797073364, "mean_norm/layer22": 11.92295503616333, "mean_norm/layer23": 11.870939314365387, "mean_norm/layer3": 11.342563092708588, "mean_norm/layer4": 10.119135022163391, "mean_norm/layer5": 12.580202519893646, "mean_norm/layer6": 9.623411118984222, "mean_norm/layer7": 10.160789787769318, "mean_norm/layer8": 10.660134971141815, "mean_norm/layer9": 10.58687698841095, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 10300 }, { "epoch": 4.3, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4662594354737307, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7252895832061768, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.611, "eval_samples_per_second": 20.756, "eval_steps_per_second": 0.689, "step": 10300 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.32, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4687, "max_norm": 34.978092193603516, "max_norm/layer0": 27.09325408935547, "max_norm/layer1": 28.446916580200195, "max_norm/layer10": 29.938980102539062, "max_norm/layer11": 27.996728897094727, "max_norm/layer12": 31.258825302124023, "max_norm/layer13": 27.261137008666992, "max_norm/layer14": 28.864126205444336, "max_norm/layer15": 34.30337905883789, "max_norm/layer16": 28.527667999267578, "max_norm/layer17": 34.16838455200195, "max_norm/layer18": 30.128267288208008, "max_norm/layer19": 29.572622299194336, "max_norm/layer2": 22.346477508544922, "max_norm/layer20": 30.36367416381836, "max_norm/layer21": 30.041337966918945, "max_norm/layer22": 30.79248809814453, "max_norm/layer23": 29.450716018676758, "max_norm/layer3": 27.676977157592773, "max_norm/layer4": 27.40702247619629, "max_norm/layer5": 34.978092193603516, "max_norm/layer6": 23.169605255126953, "max_norm/layer7": 29.688037872314453, "max_norm/layer8": 29.44434928894043, "max_norm/layer9": 29.350614547729492, "mean_norm": 10.865495984752974, "mean_norm/layer0": 10.50440114736557, "mean_norm/layer1": 10.333391070365906, "mean_norm/layer10": 10.68735784292221, "mean_norm/layer11": 11.013559699058533, "mean_norm/layer12": 11.582540392875671, "mean_norm/layer13": 10.6851087808609, "mean_norm/layer14": 11.084410846233368, "mean_norm/layer15": 11.428485333919525, "mean_norm/layer16": 10.768832564353943, "mean_norm/layer17": 11.269369840621948, "mean_norm/layer18": 10.798486649990082, "mean_norm/layer19": 10.851684868335724, "mean_norm/layer2": 8.916000783443451, "mean_norm/layer20": 10.961656332015991, "mean_norm/layer21": 10.921466648578644, "mean_norm/layer22": 11.935903191566467, "mean_norm/layer23": 11.883876979351044, "mean_norm/layer3": 11.355989933013916, "mean_norm/layer4": 10.12704610824585, "mean_norm/layer5": 12.597833693027496, "mean_norm/layer6": 9.629578769207, "mean_norm/layer7": 10.168816149234772, "mean_norm/layer8": 10.669798731803894, "mean_norm/layer9": 10.596307277679443, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 10350 }, { "epoch": 4.32, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4666691003192141, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7238152027130127, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.83, "eval_samples_per_second": 20.372, "eval_steps_per_second": 0.676, "step": 10350 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.34, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4675, "max_norm": 35.09250259399414, "max_norm/layer0": 27.170841217041016, "max_norm/layer1": 28.54010009765625, "max_norm/layer10": 30.02427864074707, "max_norm/layer11": 28.07108497619629, "max_norm/layer12": 31.37407684326172, "max_norm/layer13": 27.350177764892578, "max_norm/layer14": 28.96674156188965, "max_norm/layer15": 34.41961669921875, "max_norm/layer16": 28.634737014770508, "max_norm/layer17": 34.30854034423828, "max_norm/layer18": 30.215808868408203, "max_norm/layer19": 29.66392707824707, "max_norm/layer2": 22.399484634399414, "max_norm/layer20": 30.463783264160156, "max_norm/layer21": 30.12825584411621, "max_norm/layer22": 30.878080368041992, "max_norm/layer23": 29.53550910949707, "max_norm/layer3": 27.760766983032227, "max_norm/layer4": 27.49215316772461, "max_norm/layer5": 35.09250259399414, "max_norm/layer6": 23.237085342407227, "max_norm/layer7": 29.78689956665039, "max_norm/layer8": 29.529512405395508, "max_norm/layer9": 29.437997817993164, "mean_norm": 10.875869582096735, "mean_norm/layer0": 10.517846643924713, "mean_norm/layer1": 10.343126773834229, "mean_norm/layer10": 10.696803987026215, "mean_norm/layer11": 11.02418839931488, "mean_norm/layer12": 11.595861494541168, "mean_norm/layer13": 10.69503504037857, "mean_norm/layer14": 11.095302939414978, "mean_norm/layer15": 11.440791726112366, "mean_norm/layer16": 10.778616189956665, "mean_norm/layer17": 11.280155301094055, "mean_norm/layer18": 10.807569742202759, "mean_norm/layer19": 10.861127018928528, "mean_norm/layer2": 8.919726192951202, "mean_norm/layer20": 10.970995128154755, "mean_norm/layer21": 10.93109941482544, "mean_norm/layer22": 11.948687732219696, "mean_norm/layer23": 11.896688163280487, "mean_norm/layer3": 11.369346380233765, "mean_norm/layer4": 10.135048031806946, "mean_norm/layer5": 12.615287721157074, "mean_norm/layer6": 9.63567179441452, "mean_norm/layer7": 10.176795840263367, "mean_norm/layer8": 10.679445087909698, "mean_norm/layer9": 10.60565322637558, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 10400 }, { "epoch": 4.34, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46639734245141823, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.720466136932373, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8264, "eval_samples_per_second": 20.378, "eval_steps_per_second": 0.676, "step": 10400 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.36, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4832, "max_norm": 35.20648193359375, "max_norm/layer0": 27.249309539794922, "max_norm/layer1": 28.6260986328125, "max_norm/layer10": 30.132997512817383, "max_norm/layer11": 28.141712188720703, "max_norm/layer12": 31.486787796020508, "max_norm/layer13": 27.444744110107422, "max_norm/layer14": 29.066604614257812, "max_norm/layer15": 34.534122467041016, "max_norm/layer16": 28.72284698486328, "max_norm/layer17": 34.44967269897461, "max_norm/layer18": 30.303834915161133, "max_norm/layer19": 29.760055541992188, "max_norm/layer2": 22.440155029296875, "max_norm/layer20": 30.55260467529297, "max_norm/layer21": 30.21926498413086, "max_norm/layer22": 30.969770431518555, "max_norm/layer23": 29.619102478027344, "max_norm/layer3": 27.84838104248047, "max_norm/layer4": 27.581743240356445, "max_norm/layer5": 35.20648193359375, "max_norm/layer6": 23.2900447845459, "max_norm/layer7": 29.881126403808594, "max_norm/layer8": 29.612140655517578, "max_norm/layer9": 29.506317138671875, "mean_norm": 10.886188079913458, "mean_norm/layer0": 10.531225800514221, "mean_norm/layer1": 10.35285609960556, "mean_norm/layer10": 10.706222176551819, "mean_norm/layer11": 11.034725069999695, "mean_norm/layer12": 11.609041213989258, "mean_norm/layer13": 10.704964399337769, "mean_norm/layer14": 11.106115698814392, "mean_norm/layer15": 11.453032970428467, "mean_norm/layer16": 10.78825443983078, "mean_norm/layer17": 11.290884613990784, "mean_norm/layer18": 10.816619038581848, "mean_norm/layer19": 10.870469331741333, "mean_norm/layer2": 8.923380255699158, "mean_norm/layer20": 10.980166375637054, "mean_norm/layer21": 10.9404656291008, "mean_norm/layer22": 11.961466610431671, "mean_norm/layer23": 11.909380972385406, "mean_norm/layer3": 11.38276892900467, "mean_norm/layer4": 10.14309161901474, "mean_norm/layer5": 12.632707595825195, "mean_norm/layer6": 9.641742944717407, "mean_norm/layer7": 10.184781432151794, "mean_norm/layer8": 10.689123392105103, "mean_norm/layer9": 10.61502730846405, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 10450 }, { "epoch": 4.36, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4669814190628004, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.727762460708618, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8074, "eval_samples_per_second": 20.411, "eval_steps_per_second": 0.678, "step": 10450 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.38, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4735, "max_norm": 35.31102752685547, "max_norm/layer0": 27.322124481201172, "max_norm/layer1": 28.704631805419922, "max_norm/layer10": 30.22309684753418, "max_norm/layer11": 28.21150016784668, "max_norm/layer12": 31.58722686767578, "max_norm/layer13": 27.54606819152832, "max_norm/layer14": 29.150634765625, "max_norm/layer15": 34.65001678466797, "max_norm/layer16": 28.81109619140625, "max_norm/layer17": 34.57710266113281, "max_norm/layer18": 30.40672492980957, "max_norm/layer19": 29.857248306274414, "max_norm/layer2": 22.493066787719727, "max_norm/layer20": 30.625856399536133, "max_norm/layer21": 30.31292152404785, "max_norm/layer22": 31.06342887878418, "max_norm/layer23": 29.703598022460938, "max_norm/layer3": 27.929664611816406, "max_norm/layer4": 27.665664672851562, "max_norm/layer5": 35.31102752685547, "max_norm/layer6": 23.348833084106445, "max_norm/layer7": 29.977657318115234, "max_norm/layer8": 29.692916870117188, "max_norm/layer9": 29.58916473388672, "mean_norm": 10.896445403496424, "mean_norm/layer0": 10.544557332992554, "mean_norm/layer1": 10.36272656917572, "mean_norm/layer10": 10.715586066246033, "mean_norm/layer11": 11.045181214809418, "mean_norm/layer12": 11.622164130210876, "mean_norm/layer13": 10.71480655670166, "mean_norm/layer14": 11.11687183380127, "mean_norm/layer15": 11.465251564979553, "mean_norm/layer16": 10.797833800315857, "mean_norm/layer17": 11.301512777805328, "mean_norm/layer18": 10.825657427310944, "mean_norm/layer19": 10.87968373298645, "mean_norm/layer2": 8.926989018917084, "mean_norm/layer20": 10.989526093006134, "mean_norm/layer21": 10.949874520301819, "mean_norm/layer22": 11.974126279354095, "mean_norm/layer23": 11.922089457511902, "mean_norm/layer3": 11.395866453647614, "mean_norm/layer4": 10.151008665561676, "mean_norm/layer5": 12.650058627128601, "mean_norm/layer6": 9.647817850112915, "mean_norm/layer7": 10.19264006614685, "mean_norm/layer8": 10.698614120483398, "mean_norm/layer9": 10.624245524406433, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 10500 }, { "epoch": 4.38, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46716394300385733, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.722189426422119, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8232, "eval_samples_per_second": 20.384, "eval_steps_per_second": 0.677, "step": 10500 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.41, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4798, "max_norm": 35.41484069824219, "max_norm/layer0": 27.402650833129883, "max_norm/layer1": 28.785425186157227, "max_norm/layer10": 30.307842254638672, "max_norm/layer11": 28.27923011779785, "max_norm/layer12": 31.686256408691406, "max_norm/layer13": 27.649747848510742, "max_norm/layer14": 29.226646423339844, "max_norm/layer15": 34.76811599731445, "max_norm/layer16": 28.895538330078125, "max_norm/layer17": 34.68964385986328, "max_norm/layer18": 30.481956481933594, "max_norm/layer19": 29.93875503540039, "max_norm/layer2": 22.53553009033203, "max_norm/layer20": 30.70552635192871, "max_norm/layer21": 30.40555763244629, "max_norm/layer22": 31.15724754333496, "max_norm/layer23": 29.78316879272461, "max_norm/layer3": 28.027681350708008, "max_norm/layer4": 27.753910064697266, "max_norm/layer5": 35.41484069824219, "max_norm/layer6": 23.405353546142578, "max_norm/layer7": 30.058359146118164, "max_norm/layer8": 29.767122268676758, "max_norm/layer9": 29.67656135559082, "mean_norm": 10.90666925907135, "mean_norm/layer0": 10.55777508020401, "mean_norm/layer1": 10.37240594625473, "mean_norm/layer10": 10.724979639053345, "mean_norm/layer11": 11.055671870708466, "mean_norm/layer12": 11.635342717170715, "mean_norm/layer13": 10.724624454975128, "mean_norm/layer14": 11.127586245536804, "mean_norm/layer15": 11.477472305297852, "mean_norm/layer16": 10.807492911815643, "mean_norm/layer17": 11.312130510807037, "mean_norm/layer18": 10.83464765548706, "mean_norm/layer19": 10.888959348201752, "mean_norm/layer2": 8.930633246898651, "mean_norm/layer20": 10.998526573181152, "mean_norm/layer21": 10.959003448486328, "mean_norm/layer22": 11.986606121063232, "mean_norm/layer23": 11.93477600812912, "mean_norm/layer3": 11.40896886587143, "mean_norm/layer4": 10.158946633338928, "mean_norm/layer5": 12.667472839355469, "mean_norm/layer6": 9.653771996498108, "mean_norm/layer7": 10.20052433013916, "mean_norm/layer8": 10.7082160115242, "mean_norm/layer9": 10.63352745771408, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 10550 }, { "epoch": 4.41, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4674235326089161, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7157599925994873, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8578, "eval_samples_per_second": 20.324, "eval_steps_per_second": 0.675, "step": 10550 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.43, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4831, "max_norm": 35.51637649536133, "max_norm/layer0": 27.475908279418945, "max_norm/layer1": 28.86876106262207, "max_norm/layer10": 30.390464782714844, "max_norm/layer11": 28.36003303527832, "max_norm/layer12": 31.778034210205078, "max_norm/layer13": 27.747234344482422, "max_norm/layer14": 29.308727264404297, "max_norm/layer15": 34.87663650512695, "max_norm/layer16": 28.978439331054688, "max_norm/layer17": 34.80805587768555, "max_norm/layer18": 30.56378173828125, "max_norm/layer19": 30.048263549804688, "max_norm/layer2": 22.57395362854004, "max_norm/layer20": 30.787128448486328, "max_norm/layer21": 30.525808334350586, "max_norm/layer22": 31.266019821166992, "max_norm/layer23": 29.866968154907227, "max_norm/layer3": 28.12118911743164, "max_norm/layer4": 27.834333419799805, "max_norm/layer5": 35.51637649536133, "max_norm/layer6": 23.4639835357666, "max_norm/layer7": 30.14113998413086, "max_norm/layer8": 29.85468864440918, "max_norm/layer9": 29.7611026763916, "mean_norm": 10.916920227309069, "mean_norm/layer0": 10.570904314517975, "mean_norm/layer1": 10.38205361366272, "mean_norm/layer10": 10.734330654144287, "mean_norm/layer11": 11.066179275512695, "mean_norm/layer12": 11.64851301908493, "mean_norm/layer13": 10.73451679944992, "mean_norm/layer14": 11.138398826122284, "mean_norm/layer15": 11.48961079120636, "mean_norm/layer16": 10.817120850086212, "mean_norm/layer17": 11.322860479354858, "mean_norm/layer18": 10.843526363372803, "mean_norm/layer19": 10.898203313350677, "mean_norm/layer2": 8.934328258037567, "mean_norm/layer20": 11.007682263851166, "mean_norm/layer21": 10.968221306800842, "mean_norm/layer22": 11.999272584915161, "mean_norm/layer23": 11.947436928749084, "mean_norm/layer3": 11.422153949737549, "mean_norm/layer4": 10.166811406612396, "mean_norm/layer5": 12.684915959835052, "mean_norm/layer6": 9.659890413284302, "mean_norm/layer7": 10.20842158794403, "mean_norm/layer8": 10.717842519283295, "mean_norm/layer9": 10.642889976501465, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 10600 }, { "epoch": 4.43, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4667339977204788, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7145159244537354, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8076, "eval_samples_per_second": 20.411, "eval_steps_per_second": 0.678, "step": 10600 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.45, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4806, "max_norm": 35.609092712402344, "max_norm/layer0": 27.55437660217285, "max_norm/layer1": 28.942262649536133, "max_norm/layer10": 30.47496795654297, "max_norm/layer11": 28.428438186645508, "max_norm/layer12": 31.868505477905273, "max_norm/layer13": 27.855722427368164, "max_norm/layer14": 29.389577865600586, "max_norm/layer15": 34.96714401245117, "max_norm/layer16": 29.079998016357422, "max_norm/layer17": 34.91963577270508, "max_norm/layer18": 30.655733108520508, "max_norm/layer19": 30.14913558959961, "max_norm/layer2": 22.608745574951172, "max_norm/layer20": 30.87098503112793, "max_norm/layer21": 30.627986907958984, "max_norm/layer22": 31.354114532470703, "max_norm/layer23": 29.948514938354492, "max_norm/layer3": 28.209653854370117, "max_norm/layer4": 27.917613983154297, "max_norm/layer5": 35.609092712402344, "max_norm/layer6": 23.53098487854004, "max_norm/layer7": 30.23145294189453, "max_norm/layer8": 29.94053840637207, "max_norm/layer9": 29.844087600708008, "mean_norm": 10.927273042500019, "mean_norm/layer0": 10.584196090698242, "mean_norm/layer1": 10.391879200935364, "mean_norm/layer10": 10.74368441104889, "mean_norm/layer11": 11.076675713062286, "mean_norm/layer12": 11.661826848983765, "mean_norm/layer13": 10.744428396224976, "mean_norm/layer14": 11.149281024932861, "mean_norm/layer15": 11.501932203769684, "mean_norm/layer16": 10.826817870140076, "mean_norm/layer17": 11.333656907081604, "mean_norm/layer18": 10.852577328681946, "mean_norm/layer19": 10.907494246959686, "mean_norm/layer2": 8.938007533550262, "mean_norm/layer20": 11.017000377178192, "mean_norm/layer21": 10.977705717086792, "mean_norm/layer22": 12.012137532234192, "mean_norm/layer23": 11.960254788398743, "mean_norm/layer3": 11.435484945774078, "mean_norm/layer4": 10.174837708473206, "mean_norm/layer5": 12.702556490898132, "mean_norm/layer6": 9.666034281253815, "mean_norm/layer7": 10.216350853443146, "mean_norm/layer8": 10.727464079856873, "mean_norm/layer9": 10.652268469333649, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 10650 }, { "epoch": 4.45, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46697736297522136, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7170541286468506, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.7982, "eval_samples_per_second": 20.427, "eval_steps_per_second": 0.678, "step": 10650 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.47, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4783, "max_norm": 35.705467224121094, "max_norm/layer0": 27.62490463256836, "max_norm/layer1": 29.019390106201172, "max_norm/layer10": 30.577533721923828, "max_norm/layer11": 28.49982452392578, "max_norm/layer12": 31.976930618286133, "max_norm/layer13": 27.960256576538086, "max_norm/layer14": 29.463733673095703, "max_norm/layer15": 35.0821647644043, "max_norm/layer16": 29.184551239013672, "max_norm/layer17": 35.04167175292969, "max_norm/layer18": 30.749788284301758, "max_norm/layer19": 30.25857162475586, "max_norm/layer2": 22.64493751525879, "max_norm/layer20": 30.958097457885742, "max_norm/layer21": 30.731101989746094, "max_norm/layer22": 31.439579010009766, "max_norm/layer23": 30.029600143432617, "max_norm/layer3": 28.30475616455078, "max_norm/layer4": 28.00230598449707, "max_norm/layer5": 35.705467224121094, "max_norm/layer6": 23.597314834594727, "max_norm/layer7": 30.324081420898438, "max_norm/layer8": 30.024124145507812, "max_norm/layer9": 29.914560317993164, "mean_norm": 10.937589218219122, "mean_norm/layer0": 10.597443342208862, "mean_norm/layer1": 10.40154081583023, "mean_norm/layer10": 10.753035068511963, "mean_norm/layer11": 11.087162613868713, "mean_norm/layer12": 11.675267100334167, "mean_norm/layer13": 10.754276752471924, "mean_norm/layer14": 11.160140216350555, "mean_norm/layer15": 11.5142263174057, "mean_norm/layer16": 10.836543262004852, "mean_norm/layer17": 11.34443885087967, "mean_norm/layer18": 10.861545503139496, "mean_norm/layer19": 10.916850566864014, "mean_norm/layer2": 8.94169694185257, "mean_norm/layer20": 11.026383817195892, "mean_norm/layer21": 10.987124800682068, "mean_norm/layer22": 12.02495139837265, "mean_norm/layer23": 11.972956240177155, "mean_norm/layer3": 11.448661506175995, "mean_norm/layer4": 10.182782769203186, "mean_norm/layer5": 12.720122337341309, "mean_norm/layer6": 9.672084748744965, "mean_norm/layer7": 10.224287867546082, "mean_norm/layer8": 10.737088739871979, "mean_norm/layer9": 10.661529660224915, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 10700 }, { "epoch": 4.47, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4673667473828095, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7178053855895996, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8381, "eval_samples_per_second": 20.358, "eval_steps_per_second": 0.676, "step": 10700 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.49, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4828, "max_norm": 35.80092239379883, "max_norm/layer0": 27.704483032226562, "max_norm/layer1": 29.09988021850586, "max_norm/layer10": 30.672069549560547, "max_norm/layer11": 28.57552719116211, "max_norm/layer12": 32.09391403198242, "max_norm/layer13": 28.066116333007812, "max_norm/layer14": 29.550426483154297, "max_norm/layer15": 35.199127197265625, "max_norm/layer16": 29.278635025024414, "max_norm/layer17": 35.16794204711914, "max_norm/layer18": 30.849281311035156, "max_norm/layer19": 30.358570098876953, "max_norm/layer2": 22.691360473632812, "max_norm/layer20": 31.052244186401367, "max_norm/layer21": 30.848957061767578, "max_norm/layer22": 31.532005310058594, "max_norm/layer23": 30.109872817993164, "max_norm/layer3": 28.392465591430664, "max_norm/layer4": 28.095552444458008, "max_norm/layer5": 35.80092239379883, "max_norm/layer6": 23.654541015625, "max_norm/layer7": 30.412067413330078, "max_norm/layer8": 30.113658905029297, "max_norm/layer9": 29.99777603149414, "mean_norm": 10.947911076247692, "mean_norm/layer0": 10.610689520835876, "mean_norm/layer1": 10.411279439926147, "mean_norm/layer10": 10.762393414974213, "mean_norm/layer11": 11.097654044628143, "mean_norm/layer12": 11.688684284687042, "mean_norm/layer13": 10.764097929000854, "mean_norm/layer14": 11.170956254005432, "mean_norm/layer15": 11.526572465896606, "mean_norm/layer16": 10.846267402172089, "mean_norm/layer17": 11.355244040489197, "mean_norm/layer18": 10.870476722717285, "mean_norm/layer19": 10.926155745983124, "mean_norm/layer2": 8.945383906364441, "mean_norm/layer20": 11.035573720932007, "mean_norm/layer21": 10.996546864509583, "mean_norm/layer22": 12.03775930404663, "mean_norm/layer23": 11.985740721225739, "mean_norm/layer3": 11.461913466453552, "mean_norm/layer4": 10.19075322151184, "mean_norm/layer5": 12.737750947475433, "mean_norm/layer6": 9.67819058895111, "mean_norm/layer7": 10.232214033603668, "mean_norm/layer8": 10.746669948101044, "mean_norm/layer9": 10.670897841453552, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 10750 }, { "epoch": 4.49, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4685267884304158, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7106406688690186, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8382, "eval_samples_per_second": 20.358, "eval_steps_per_second": 0.676, "step": 10750 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.51, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4824, "max_norm": 35.902252197265625, "max_norm/layer0": 27.77450180053711, "max_norm/layer1": 29.19710922241211, "max_norm/layer10": 30.76256561279297, "max_norm/layer11": 28.64341926574707, "max_norm/layer12": 32.20515823364258, "max_norm/layer13": 28.149314880371094, "max_norm/layer14": 29.625675201416016, "max_norm/layer15": 35.318763732910156, "max_norm/layer16": 29.381330490112305, "max_norm/layer17": 35.283477783203125, "max_norm/layer18": 30.946577072143555, "max_norm/layer19": 30.443479537963867, "max_norm/layer2": 22.751590728759766, "max_norm/layer20": 31.136180877685547, "max_norm/layer21": 30.948503494262695, "max_norm/layer22": 31.631589889526367, "max_norm/layer23": 30.19828224182129, "max_norm/layer3": 28.473833084106445, "max_norm/layer4": 28.17934226989746, "max_norm/layer5": 35.902252197265625, "max_norm/layer6": 23.716323852539062, "max_norm/layer7": 30.506010055541992, "max_norm/layer8": 30.187671661376953, "max_norm/layer9": 30.072362899780273, "mean_norm": 10.958240871628126, "mean_norm/layer0": 10.623964190483093, "mean_norm/layer1": 10.421046495437622, "mean_norm/layer10": 10.771743476390839, "mean_norm/layer11": 11.10817575454712, "mean_norm/layer12": 11.702056527137756, "mean_norm/layer13": 10.774037420749664, "mean_norm/layer14": 11.181804180145264, "mean_norm/layer15": 11.53890997171402, "mean_norm/layer16": 10.85598087310791, "mean_norm/layer17": 11.366090714931488, "mean_norm/layer18": 10.879380404949188, "mean_norm/layer19": 10.935488760471344, "mean_norm/layer2": 8.94908481836319, "mean_norm/layer20": 11.04500299692154, "mean_norm/layer21": 11.00584191083908, "mean_norm/layer22": 12.050399005413055, "mean_norm/layer23": 11.998490035533905, "mean_norm/layer3": 11.475232481956482, "mean_norm/layer4": 10.198665499687195, "mean_norm/layer5": 12.75539767742157, "mean_norm/layer6": 9.684304535388947, "mean_norm/layer7": 10.240188002586365, "mean_norm/layer8": 10.756260454654694, "mean_norm/layer9": 10.680234730243683, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 10800 }, { "epoch": 4.51, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4672450647554382, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7115914821624756, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8271, "eval_samples_per_second": 20.377, "eval_steps_per_second": 0.676, "step": 10800 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.53, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4838, "max_norm": 36.001617431640625, "max_norm/layer0": 27.83734893798828, "max_norm/layer1": 29.293045043945312, "max_norm/layer10": 30.840595245361328, "max_norm/layer11": 28.707897186279297, "max_norm/layer12": 32.31393814086914, "max_norm/layer13": 28.230504989624023, "max_norm/layer14": 29.70939826965332, "max_norm/layer15": 35.45550537109375, "max_norm/layer16": 29.47163963317871, "max_norm/layer17": 35.38703536987305, "max_norm/layer18": 31.027469635009766, "max_norm/layer19": 30.52695655822754, "max_norm/layer2": 22.79546356201172, "max_norm/layer20": 31.22841453552246, "max_norm/layer21": 31.03502655029297, "max_norm/layer22": 31.733074188232422, "max_norm/layer23": 30.28806495666504, "max_norm/layer3": 28.55718421936035, "max_norm/layer4": 28.254390716552734, "max_norm/layer5": 36.001617431640625, "max_norm/layer6": 23.774742126464844, "max_norm/layer7": 30.59893798828125, "max_norm/layer8": 30.25242042541504, "max_norm/layer9": 30.142948150634766, "mean_norm": 10.968432190517584, "mean_norm/layer0": 10.637080550193787, "mean_norm/layer1": 10.430836737155914, "mean_norm/layer10": 10.781019687652588, "mean_norm/layer11": 11.118514716625214, "mean_norm/layer12": 11.715137422084808, "mean_norm/layer13": 10.78377228975296, "mean_norm/layer14": 11.192479372024536, "mean_norm/layer15": 11.551107704639435, "mean_norm/layer16": 10.865435600280762, "mean_norm/layer17": 11.376686751842499, "mean_norm/layer18": 10.888093769550323, "mean_norm/layer19": 10.944684505462646, "mean_norm/layer2": 8.952727675437927, "mean_norm/layer20": 11.054252862930298, "mean_norm/layer21": 11.015106618404388, "mean_norm/layer22": 12.062939047813416, "mean_norm/layer23": 12.011112213134766, "mean_norm/layer3": 11.488403975963593, "mean_norm/layer4": 10.206504702568054, "mean_norm/layer5": 12.77285772562027, "mean_norm/layer6": 9.69041132926941, "mean_norm/layer7": 10.248039662837982, "mean_norm/layer8": 10.765750110149384, "mean_norm/layer9": 10.689417541027069, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 10850 }, { "epoch": 4.53, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46874987324726314, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7068047523498535, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8269, "eval_samples_per_second": 20.377, "eval_steps_per_second": 0.676, "step": 10850 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.55, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4766, "max_norm": 36.10050964355469, "max_norm/layer0": 27.90643882751465, "max_norm/layer1": 29.393217086791992, "max_norm/layer10": 30.925491333007812, "max_norm/layer11": 28.774173736572266, "max_norm/layer12": 32.422420501708984, "max_norm/layer13": 28.32280921936035, "max_norm/layer14": 29.791353225708008, "max_norm/layer15": 35.58605194091797, "max_norm/layer16": 29.558443069458008, "max_norm/layer17": 35.482425689697266, "max_norm/layer18": 31.133277893066406, "max_norm/layer19": 30.631622314453125, "max_norm/layer2": 22.839784622192383, "max_norm/layer20": 31.314443588256836, "max_norm/layer21": 31.123477935791016, "max_norm/layer22": 31.825902938842773, "max_norm/layer23": 30.378795623779297, "max_norm/layer3": 28.63979148864746, "max_norm/layer4": 28.323528289794922, "max_norm/layer5": 36.10050964355469, "max_norm/layer6": 23.828092575073242, "max_norm/layer7": 30.709747314453125, "max_norm/layer8": 30.32479476928711, "max_norm/layer9": 30.2420654296875, "mean_norm": 10.978607185184956, "mean_norm/layer0": 10.650204837322235, "mean_norm/layer1": 10.440573155879974, "mean_norm/layer10": 10.79030156135559, "mean_norm/layer11": 11.128903448581696, "mean_norm/layer12": 11.7282093167305, "mean_norm/layer13": 10.793516874313354, "mean_norm/layer14": 11.203150153160095, "mean_norm/layer15": 11.563211679458618, "mean_norm/layer16": 10.874927461147308, "mean_norm/layer17": 11.387232065200806, "mean_norm/layer18": 10.896808683872223, "mean_norm/layer19": 10.953786313533783, "mean_norm/layer2": 8.956369996070862, "mean_norm/layer20": 11.063383102416992, "mean_norm/layer21": 11.024434506893158, "mean_norm/layer22": 12.075482964515686, "mean_norm/layer23": 12.023701608181, "mean_norm/layer3": 11.501590967178345, "mean_norm/layer4": 10.214413344860077, "mean_norm/layer5": 12.790341198444366, "mean_norm/layer6": 9.696370244026184, "mean_norm/layer7": 10.255893349647522, "mean_norm/layer8": 10.775194346904755, "mean_norm/layer9": 10.698571264743805, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 10900 }, { "epoch": 4.55, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46807250662156297, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7072505950927734, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.5674, "eval_samples_per_second": 20.834, "eval_steps_per_second": 0.692, "step": 10900 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.57, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4951, "max_norm": 36.194454193115234, "max_norm/layer0": 27.984460830688477, "max_norm/layer1": 29.48598289489746, "max_norm/layer10": 31.01220703125, "max_norm/layer11": 28.84075164794922, "max_norm/layer12": 32.5153694152832, "max_norm/layer13": 28.403606414794922, "max_norm/layer14": 29.87116241455078, "max_norm/layer15": 35.694305419921875, "max_norm/layer16": 29.650407791137695, "max_norm/layer17": 35.60575866699219, "max_norm/layer18": 31.23323631286621, "max_norm/layer19": 30.72925567626953, "max_norm/layer2": 22.884504318237305, "max_norm/layer20": 31.395549774169922, "max_norm/layer21": 31.2160587310791, "max_norm/layer22": 31.92021369934082, "max_norm/layer23": 30.462398529052734, "max_norm/layer3": 28.742555618286133, "max_norm/layer4": 28.39634132385254, "max_norm/layer5": 36.194454193115234, "max_norm/layer6": 23.88254737854004, "max_norm/layer7": 30.820144653320312, "max_norm/layer8": 30.39653205871582, "max_norm/layer9": 30.330341339111328, "mean_norm": 10.98867952823639, "mean_norm/layer0": 10.663160026073456, "mean_norm/layer1": 10.450208723545074, "mean_norm/layer10": 10.79953122138977, "mean_norm/layer11": 11.139248013496399, "mean_norm/layer12": 11.741204142570496, "mean_norm/layer13": 10.803188383579254, "mean_norm/layer14": 11.21361792087555, "mean_norm/layer15": 11.575240135192871, "mean_norm/layer16": 10.88437169790268, "mean_norm/layer17": 11.39776086807251, "mean_norm/layer18": 10.905632257461548, "mean_norm/layer19": 10.962841093540192, "mean_norm/layer2": 8.959905982017517, "mean_norm/layer20": 11.072368741035461, "mean_norm/layer21": 11.033558368682861, "mean_norm/layer22": 12.0879687666893, "mean_norm/layer23": 12.036184847354889, "mean_norm/layer3": 11.514626264572144, "mean_norm/layer4": 10.222147405147552, "mean_norm/layer5": 12.807550191879272, "mean_norm/layer6": 9.702159464359283, "mean_norm/layer7": 10.263650834560394, "mean_norm/layer8": 10.784475028514862, "mean_norm/layer9": 10.707708299160004, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 10950 }, { "epoch": 4.57, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4685105640800996, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7058496475219727, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8398, "eval_samples_per_second": 20.355, "eval_steps_per_second": 0.676, "step": 10950 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.59, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4968, "max_norm": 36.29143142700195, "max_norm/layer0": 28.067821502685547, "max_norm/layer1": 29.572872161865234, "max_norm/layer10": 31.0950927734375, "max_norm/layer11": 28.908004760742188, "max_norm/layer12": 32.61347579956055, "max_norm/layer13": 28.48408317565918, "max_norm/layer14": 29.953489303588867, "max_norm/layer15": 35.82485580444336, "max_norm/layer16": 29.73497200012207, "max_norm/layer17": 35.71292495727539, "max_norm/layer18": 31.33292579650879, "max_norm/layer19": 30.821983337402344, "max_norm/layer2": 22.939258575439453, "max_norm/layer20": 31.488800048828125, "max_norm/layer21": 31.312997817993164, "max_norm/layer22": 32.024410247802734, "max_norm/layer23": 30.548397064208984, "max_norm/layer3": 28.828319549560547, "max_norm/layer4": 28.46470832824707, "max_norm/layer5": 36.29143142700195, "max_norm/layer6": 23.948667526245117, "max_norm/layer7": 30.933961868286133, "max_norm/layer8": 30.480300903320312, "max_norm/layer9": 30.43441390991211, "mean_norm": 10.99889350682497, "mean_norm/layer0": 10.676221072673798, "mean_norm/layer1": 10.459985494613647, "mean_norm/layer10": 10.808838605880737, "mean_norm/layer11": 11.149834871292114, "mean_norm/layer12": 11.754562199115753, "mean_norm/layer13": 10.812919557094574, "mean_norm/layer14": 11.22424590587616, "mean_norm/layer15": 11.587432563304901, "mean_norm/layer16": 10.893988728523254, "mean_norm/layer17": 11.408426642417908, "mean_norm/layer18": 10.914457440376282, "mean_norm/layer19": 10.971990644931793, "mean_norm/layer2": 8.963540971279144, "mean_norm/layer20": 11.081362009048462, "mean_norm/layer21": 11.042804539203644, "mean_norm/layer22": 12.100537717342377, "mean_norm/layer23": 12.048828661441803, "mean_norm/layer3": 11.527796804904938, "mean_norm/layer4": 10.23012900352478, "mean_norm/layer5": 12.824970602989197, "mean_norm/layer6": 9.708126485347748, "mean_norm/layer7": 10.271549999713898, "mean_norm/layer8": 10.793979287147522, "mean_norm/layer9": 10.716914355754852, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 11000 }, { "epoch": 4.59, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46899323850200575, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.708869218826294, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8407, "eval_samples_per_second": 20.354, "eval_steps_per_second": 0.676, "step": 11000 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.61, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5027, "max_norm": 36.38948440551758, "max_norm/layer0": 28.142681121826172, "max_norm/layer1": 29.65342903137207, "max_norm/layer10": 31.172306060791016, "max_norm/layer11": 28.979270935058594, "max_norm/layer12": 32.718421936035156, "max_norm/layer13": 28.559803009033203, "max_norm/layer14": 30.038625717163086, "max_norm/layer15": 35.952938079833984, "max_norm/layer16": 29.816696166992188, "max_norm/layer17": 35.83388900756836, "max_norm/layer18": 31.439905166625977, "max_norm/layer19": 30.919139862060547, "max_norm/layer2": 22.99624252319336, "max_norm/layer20": 31.571073532104492, "max_norm/layer21": 31.403352737426758, "max_norm/layer22": 32.12685012817383, "max_norm/layer23": 30.628877639770508, "max_norm/layer3": 28.90157699584961, "max_norm/layer4": 28.525489807128906, "max_norm/layer5": 36.38948440551758, "max_norm/layer6": 24.00628662109375, "max_norm/layer7": 31.039264678955078, "max_norm/layer8": 30.567359924316406, "max_norm/layer9": 30.537586212158203, "mean_norm": 11.008995535473028, "mean_norm/layer0": 10.68915969133377, "mean_norm/layer1": 10.46977412700653, "mean_norm/layer10": 10.818095445632935, "mean_norm/layer11": 11.16015911102295, "mean_norm/layer12": 11.767687618732452, "mean_norm/layer13": 10.822493731975555, "mean_norm/layer14": 11.234766364097595, "mean_norm/layer15": 11.599426746368408, "mean_norm/layer16": 10.903450429439545, "mean_norm/layer17": 11.418922483921051, "mean_norm/layer18": 10.923265159130096, "mean_norm/layer19": 10.981090009212494, "mean_norm/layer2": 8.967131793498993, "mean_norm/layer20": 11.090291917324066, "mean_norm/layer21": 11.05186927318573, "mean_norm/layer22": 12.113010346889496, "mean_norm/layer23": 12.061234652996063, "mean_norm/layer3": 11.540878176689148, "mean_norm/layer4": 10.238067269325256, "mean_norm/layer5": 12.84223461151123, "mean_norm/layer6": 9.714037954807281, "mean_norm/layer7": 10.279354095458984, "mean_norm/layer8": 10.803401052951813, "mean_norm/layer9": 10.726090788841248, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 11050 }, { "epoch": 4.61, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4690013506771638, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7019741535186768, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6244, "eval_samples_per_second": 20.732, "eval_steps_per_second": 0.688, "step": 11050 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.63, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4867, "max_norm": 36.485416412353516, "max_norm/layer0": 28.211668014526367, "max_norm/layer1": 29.72883415222168, "max_norm/layer10": 31.23760986328125, "max_norm/layer11": 29.053224563598633, "max_norm/layer12": 32.811614990234375, "max_norm/layer13": 28.64307975769043, "max_norm/layer14": 30.11770248413086, "max_norm/layer15": 36.074459075927734, "max_norm/layer16": 29.89780044555664, "max_norm/layer17": 35.94729232788086, "max_norm/layer18": 31.554128646850586, "max_norm/layer19": 31.01970100402832, "max_norm/layer2": 23.0423641204834, "max_norm/layer20": 31.650583267211914, "max_norm/layer21": 31.490772247314453, "max_norm/layer22": 32.22224426269531, "max_norm/layer23": 30.71469497680664, "max_norm/layer3": 28.968250274658203, "max_norm/layer4": 28.582042694091797, "max_norm/layer5": 36.485416412353516, "max_norm/layer6": 24.07797622680664, "max_norm/layer7": 31.14894676208496, "max_norm/layer8": 30.651403427124023, "max_norm/layer9": 30.636816024780273, "mean_norm": 11.019032259782156, "mean_norm/layer0": 10.701907813549042, "mean_norm/layer1": 10.479356586933136, "mean_norm/layer10": 10.827310979366302, "mean_norm/layer11": 11.170374512672424, "mean_norm/layer12": 11.780598878860474, "mean_norm/layer13": 10.83207768201828, "mean_norm/layer14": 11.245192289352417, "mean_norm/layer15": 11.61131465435028, "mean_norm/layer16": 10.912882566452026, "mean_norm/layer17": 11.429385244846344, "mean_norm/layer18": 10.932092487812042, "mean_norm/layer19": 10.990167617797852, "mean_norm/layer2": 8.970707833766937, "mean_norm/layer20": 11.099395036697388, "mean_norm/layer21": 11.060913383960724, "mean_norm/layer22": 12.12530916929245, "mean_norm/layer23": 12.073706030845642, "mean_norm/layer3": 11.553913176059723, "mean_norm/layer4": 10.24598515033722, "mean_norm/layer5": 12.85935389995575, "mean_norm/layer6": 9.71992015838623, "mean_norm/layer7": 10.287022113800049, "mean_norm/layer8": 10.812736868858337, "mean_norm/layer9": 10.73515009880066, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 11100 }, { "epoch": 4.63, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4689810702392686, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.702160596847534, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8364, "eval_samples_per_second": 20.361, "eval_steps_per_second": 0.676, "step": 11100 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.66, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4907, "max_norm": 36.590641021728516, "max_norm/layer0": 28.281400680541992, "max_norm/layer1": 29.814014434814453, "max_norm/layer10": 31.30912971496582, "max_norm/layer11": 29.127084732055664, "max_norm/layer12": 32.911705017089844, "max_norm/layer13": 28.726318359375, "max_norm/layer14": 30.1971435546875, "max_norm/layer15": 36.19831085205078, "max_norm/layer16": 29.989545822143555, "max_norm/layer17": 36.075653076171875, "max_norm/layer18": 31.639633178710938, "max_norm/layer19": 31.121540069580078, "max_norm/layer2": 23.09928321838379, "max_norm/layer20": 31.74033546447754, "max_norm/layer21": 31.588829040527344, "max_norm/layer22": 32.31295394897461, "max_norm/layer23": 30.793426513671875, "max_norm/layer3": 29.041465759277344, "max_norm/layer4": 28.63759994506836, "max_norm/layer5": 36.590641021728516, "max_norm/layer6": 24.13155746459961, "max_norm/layer7": 31.24675178527832, "max_norm/layer8": 30.736846923828125, "max_norm/layer9": 30.751882553100586, "mean_norm": 11.029068134725094, "mean_norm/layer0": 10.71463930606842, "mean_norm/layer1": 10.488974511623383, "mean_norm/layer10": 10.836424171924591, "mean_norm/layer11": 11.180540084838867, "mean_norm/layer12": 11.793593287467957, "mean_norm/layer13": 10.841667890548706, "mean_norm/layer14": 11.255710542201996, "mean_norm/layer15": 11.62320464849472, "mean_norm/layer16": 10.922313868999481, "mean_norm/layer17": 11.43975281715393, "mean_norm/layer18": 10.94078254699707, "mean_norm/layer19": 10.999189674854279, "mean_norm/layer2": 8.97431856393814, "mean_norm/layer20": 11.108398020267487, "mean_norm/layer21": 11.070019721984863, "mean_norm/layer22": 12.137679636478424, "mean_norm/layer23": 12.086146414279938, "mean_norm/layer3": 11.566857933998108, "mean_norm/layer4": 10.25378680229187, "mean_norm/layer5": 12.876568496227264, "mean_norm/layer6": 9.725827276706696, "mean_norm/layer7": 10.294805943965912, "mean_norm/layer8": 10.822121918201447, "mean_norm/layer9": 10.744311153888702, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 11150 }, { "epoch": 4.66, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46954892250033464, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.702021360397339, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8177, "eval_samples_per_second": 20.393, "eval_steps_per_second": 0.677, "step": 11150 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.68, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4889, "max_norm": 36.693843841552734, "max_norm/layer0": 28.353055953979492, "max_norm/layer1": 29.90206527709961, "max_norm/layer10": 31.385793685913086, "max_norm/layer11": 29.21958351135254, "max_norm/layer12": 33.02078628540039, "max_norm/layer13": 28.812292098999023, "max_norm/layer14": 30.27202606201172, "max_norm/layer15": 36.33440399169922, "max_norm/layer16": 30.099519729614258, "max_norm/layer17": 36.19306564331055, "max_norm/layer18": 31.73409652709961, "max_norm/layer19": 31.216930389404297, "max_norm/layer2": 23.159343719482422, "max_norm/layer20": 31.83723258972168, "max_norm/layer21": 31.70283317565918, "max_norm/layer22": 32.40229034423828, "max_norm/layer23": 30.87533187866211, "max_norm/layer3": 29.103801727294922, "max_norm/layer4": 28.69968605041504, "max_norm/layer5": 36.693843841552734, "max_norm/layer6": 24.19968032836914, "max_norm/layer7": 31.33868980407715, "max_norm/layer8": 30.82036018371582, "max_norm/layer9": 30.858015060424805, "mean_norm": 11.039107086757818, "mean_norm/layer0": 10.727317333221436, "mean_norm/layer1": 10.498592138290405, "mean_norm/layer10": 10.845584452152252, "mean_norm/layer11": 11.190867006778717, "mean_norm/layer12": 11.806601226329803, "mean_norm/layer13": 10.851321637630463, "mean_norm/layer14": 11.26624971628189, "mean_norm/layer15": 11.63513070344925, "mean_norm/layer16": 10.931711971759796, "mean_norm/layer17": 11.450206220149994, "mean_norm/layer18": 10.949472665786743, "mean_norm/layer19": 11.008228719234467, "mean_norm/layer2": 8.977922022342682, "mean_norm/layer20": 11.11731094121933, "mean_norm/layer21": 11.079086363315582, "mean_norm/layer22": 12.150035500526428, "mean_norm/layer23": 12.098583281040192, "mean_norm/layer3": 11.579851865768433, "mean_norm/layer4": 10.261609435081482, "mean_norm/layer5": 12.89377510547638, "mean_norm/layer6": 9.731728971004486, "mean_norm/layer7": 10.302535831928253, "mean_norm/layer8": 10.831456780433655, "mean_norm/layer9": 10.753390192985535, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 11200 }, { "epoch": 4.68, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4700640456228731, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7000200748443604, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8823, "eval_samples_per_second": 20.282, "eval_steps_per_second": 0.673, "step": 11200 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.7, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4911, "max_norm": 36.80110168457031, "max_norm/layer0": 28.42072105407715, "max_norm/layer1": 29.987051010131836, "max_norm/layer10": 31.46202850341797, "max_norm/layer11": 29.302335739135742, "max_norm/layer12": 33.13109588623047, "max_norm/layer13": 28.901945114135742, "max_norm/layer14": 30.360057830810547, "max_norm/layer15": 36.44215393066406, "max_norm/layer16": 30.18164825439453, "max_norm/layer17": 36.3160285949707, "max_norm/layer18": 31.817520141601562, "max_norm/layer19": 31.32172966003418, "max_norm/layer2": 23.22319984436035, "max_norm/layer20": 31.919742584228516, "max_norm/layer21": 31.79605484008789, "max_norm/layer22": 32.49842834472656, "max_norm/layer23": 30.966951370239258, "max_norm/layer3": 29.168514251708984, "max_norm/layer4": 28.76665496826172, "max_norm/layer5": 36.80110168457031, "max_norm/layer6": 24.263078689575195, "max_norm/layer7": 31.429777145385742, "max_norm/layer8": 30.894712448120117, "max_norm/layer9": 30.976171493530273, "mean_norm": 11.049177487691244, "mean_norm/layer0": 10.739985823631287, "mean_norm/layer1": 10.5082568526268, "mean_norm/layer10": 10.85473507642746, "mean_norm/layer11": 11.201318681240082, "mean_norm/layer12": 11.819770455360413, "mean_norm/layer13": 10.861029326915741, "mean_norm/layer14": 11.276723444461823, "mean_norm/layer15": 11.647155404090881, "mean_norm/layer16": 10.941185355186462, "mean_norm/layer17": 11.46070909500122, "mean_norm/layer18": 10.958095967769623, "mean_norm/layer19": 11.017280280590057, "mean_norm/layer2": 8.981531858444214, "mean_norm/layer20": 11.126353204250336, "mean_norm/layer21": 11.088174939155579, "mean_norm/layer22": 12.162321031093597, "mean_norm/layer23": 12.111066281795502, "mean_norm/layer3": 11.59280115365982, "mean_norm/layer4": 10.269557535648346, "mean_norm/layer5": 12.910930395126343, "mean_norm/layer6": 9.737641453742981, "mean_norm/layer7": 10.310417890548706, "mean_norm/layer8": 10.840794563293457, "mean_norm/layer9": 10.762423634529114, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 11250 }, { "epoch": 4.7, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4693420620338034, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.6996147632598877, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.838, "eval_samples_per_second": 20.358, "eval_steps_per_second": 0.676, "step": 11250 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.72, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4906, "max_norm": 36.90290832519531, "max_norm/layer0": 28.498428344726562, "max_norm/layer1": 30.071109771728516, "max_norm/layer10": 31.552982330322266, "max_norm/layer11": 29.381942749023438, "max_norm/layer12": 33.24612045288086, "max_norm/layer13": 28.998634338378906, "max_norm/layer14": 30.43010902404785, "max_norm/layer15": 36.54443359375, "max_norm/layer16": 30.27066993713379, "max_norm/layer17": 36.46219253540039, "max_norm/layer18": 31.914384841918945, "max_norm/layer19": 31.426963806152344, "max_norm/layer2": 23.282331466674805, "max_norm/layer20": 32.007347106933594, "max_norm/layer21": 31.882448196411133, "max_norm/layer22": 32.59296417236328, "max_norm/layer23": 31.06037712097168, "max_norm/layer3": 29.24478530883789, "max_norm/layer4": 28.834274291992188, "max_norm/layer5": 36.90290832519531, "max_norm/layer6": 24.324382781982422, "max_norm/layer7": 31.510684967041016, "max_norm/layer8": 30.968204498291016, "max_norm/layer9": 31.075193405151367, "mean_norm": 11.05928177634875, "mean_norm/layer0": 10.7528635263443, "mean_norm/layer1": 10.51784473657608, "mean_norm/layer10": 10.863938212394714, "mean_norm/layer11": 11.211776793003082, "mean_norm/layer12": 11.832974255084991, "mean_norm/layer13": 10.870778441429138, "mean_norm/layer14": 11.287272453308105, "mean_norm/layer15": 11.65920740365982, "mean_norm/layer16": 10.950676381587982, "mean_norm/layer17": 11.471208274364471, "mean_norm/layer18": 10.96678340435028, "mean_norm/layer19": 11.026268124580383, "mean_norm/layer2": 8.985169887542725, "mean_norm/layer20": 11.135346353054047, "mean_norm/layer21": 11.097164869308472, "mean_norm/layer22": 12.174674391746521, "mean_norm/layer23": 12.123576819896698, "mean_norm/layer3": 11.605943202972412, "mean_norm/layer4": 10.27738219499588, "mean_norm/layer5": 12.928228676319122, "mean_norm/layer6": 9.743575870990753, "mean_norm/layer7": 10.318305909633636, "mean_norm/layer8": 10.850202322006226, "mean_norm/layer9": 10.771600127220154, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 11300 }, { "epoch": 4.72, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46931366942075015, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.702225923538208, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8556, "eval_samples_per_second": 20.328, "eval_steps_per_second": 0.675, "step": 11300 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.74, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5083, "max_norm": 36.998252868652344, "max_norm/layer0": 28.57436180114746, "max_norm/layer1": 30.16019058227539, "max_norm/layer10": 31.637813568115234, "max_norm/layer11": 29.452293395996094, "max_norm/layer12": 33.34236145019531, "max_norm/layer13": 29.110563278198242, "max_norm/layer14": 30.50075340270996, "max_norm/layer15": 36.65324783325195, "max_norm/layer16": 30.35845184326172, "max_norm/layer17": 36.59389877319336, "max_norm/layer18": 32.02538299560547, "max_norm/layer19": 31.53948211669922, "max_norm/layer2": 23.335365295410156, "max_norm/layer20": 32.10725402832031, "max_norm/layer21": 31.964698791503906, "max_norm/layer22": 32.67811584472656, "max_norm/layer23": 31.14203643798828, "max_norm/layer3": 29.3145809173584, "max_norm/layer4": 28.908462524414062, "max_norm/layer5": 36.998252868652344, "max_norm/layer6": 24.38912010192871, "max_norm/layer7": 31.59634017944336, "max_norm/layer8": 31.052322387695312, "max_norm/layer9": 31.170902252197266, "mean_norm": 11.069261901080608, "mean_norm/layer0": 10.765595376491547, "mean_norm/layer1": 10.527443945407867, "mean_norm/layer10": 10.873034358024597, "mean_norm/layer11": 11.221920251846313, "mean_norm/layer12": 11.84593778848648, "mean_norm/layer13": 10.880328059196472, "mean_norm/layer14": 11.29772400856018, "mean_norm/layer15": 11.67112535238266, "mean_norm/layer16": 10.96004843711853, "mean_norm/layer17": 11.481589019298553, "mean_norm/layer18": 10.9753977060318, "mean_norm/layer19": 11.03517997264862, "mean_norm/layer2": 8.98877876996994, "mean_norm/layer20": 11.144243478775024, "mean_norm/layer21": 11.106104969978333, "mean_norm/layer22": 12.18696117401123, "mean_norm/layer23": 12.135864198207855, "mean_norm/layer3": 11.618866682052612, "mean_norm/layer4": 10.285234451293945, "mean_norm/layer5": 12.945219874382019, "mean_norm/layer6": 9.74939090013504, "mean_norm/layer7": 10.32614415884018, "mean_norm/layer8": 10.859492838382721, "mean_norm/layer9": 10.780659854412079, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 11350 }, { "epoch": 4.74, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.470055933447715, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.698378086090088, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8271, "eval_samples_per_second": 20.377, "eval_steps_per_second": 0.676, "step": 11350 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.76, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4982, "max_norm": 37.1029052734375, "max_norm/layer0": 28.656028747558594, "max_norm/layer1": 30.25836181640625, "max_norm/layer10": 31.71713638305664, "max_norm/layer11": 29.52212905883789, "max_norm/layer12": 33.44416427612305, "max_norm/layer13": 29.218441009521484, "max_norm/layer14": 30.57339859008789, "max_norm/layer15": 36.7493896484375, "max_norm/layer16": 30.460256576538086, "max_norm/layer17": 36.72866439819336, "max_norm/layer18": 32.121299743652344, "max_norm/layer19": 31.664583206176758, "max_norm/layer2": 23.3944091796875, "max_norm/layer20": 32.202659606933594, "max_norm/layer21": 32.049556732177734, "max_norm/layer22": 32.76599884033203, "max_norm/layer23": 31.217979431152344, "max_norm/layer3": 29.3818416595459, "max_norm/layer4": 28.99262046813965, "max_norm/layer5": 37.1029052734375, "max_norm/layer6": 24.457334518432617, "max_norm/layer7": 31.686601638793945, "max_norm/layer8": 31.13671112060547, "max_norm/layer9": 31.269529342651367, "mean_norm": 11.079338165620962, "mean_norm/layer0": 10.778338432312012, "mean_norm/layer1": 10.537169218063354, "mean_norm/layer10": 10.882223546504974, "mean_norm/layer11": 11.232254266738892, "mean_norm/layer12": 11.85909241437912, "mean_norm/layer13": 10.889939963817596, "mean_norm/layer14": 11.308136761188507, "mean_norm/layer15": 11.683177769184113, "mean_norm/layer16": 10.969454109668732, "mean_norm/layer17": 11.491996049880981, "mean_norm/layer18": 10.984146773815155, "mean_norm/layer19": 11.04429715871811, "mean_norm/layer2": 8.992380321025848, "mean_norm/layer20": 11.153231382369995, "mean_norm/layer21": 11.115254282951355, "mean_norm/layer22": 12.199417114257812, "mean_norm/layer23": 12.148304343223572, "mean_norm/layer3": 11.631822049617767, "mean_norm/layer4": 10.293142974376678, "mean_norm/layer5": 12.962431788444519, "mean_norm/layer6": 9.755285799503326, "mean_norm/layer7": 10.333933413028717, "mean_norm/layer8": 10.86891096830368, "mean_norm/layer9": 10.78977507352829, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 11400 }, { "epoch": 4.76, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4695732590258089, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.696803092956543, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8371, "eval_samples_per_second": 20.36, "eval_steps_per_second": 0.676, "step": 11400 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.78, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4981, "max_norm": 37.19981384277344, "max_norm/layer0": 28.733051300048828, "max_norm/layer1": 30.349668502807617, "max_norm/layer10": 31.805160522460938, "max_norm/layer11": 29.594594955444336, "max_norm/layer12": 33.550926208496094, "max_norm/layer13": 29.31583595275879, "max_norm/layer14": 30.652856826782227, "max_norm/layer15": 36.8530387878418, "max_norm/layer16": 30.553306579589844, "max_norm/layer17": 36.866615295410156, "max_norm/layer18": 32.23554992675781, "max_norm/layer19": 31.7749080657959, "max_norm/layer2": 23.452619552612305, "max_norm/layer20": 32.29941177368164, "max_norm/layer21": 32.140113830566406, "max_norm/layer22": 32.85822677612305, "max_norm/layer23": 31.301639556884766, "max_norm/layer3": 29.454954147338867, "max_norm/layer4": 29.073352813720703, "max_norm/layer5": 37.19981384277344, "max_norm/layer6": 24.528331756591797, "max_norm/layer7": 31.778316497802734, "max_norm/layer8": 31.21552085876465, "max_norm/layer9": 31.349042892456055, "mean_norm": 11.089381170769533, "mean_norm/layer0": 10.790962219238281, "mean_norm/layer1": 10.546747326850891, "mean_norm/layer10": 10.89135366678238, "mean_norm/layer11": 11.24245822429657, "mean_norm/layer12": 11.872169077396393, "mean_norm/layer13": 10.899617612361908, "mean_norm/layer14": 11.318670332431793, "mean_norm/layer15": 11.695177555084229, "mean_norm/layer16": 10.97891902923584, "mean_norm/layer17": 11.502409100532532, "mean_norm/layer18": 10.992907166481018, "mean_norm/layer19": 11.053321421146393, "mean_norm/layer2": 8.995991051197052, "mean_norm/layer20": 11.16218513250351, "mean_norm/layer21": 11.124274849891663, "mean_norm/layer22": 12.21173882484436, "mean_norm/layer23": 12.160701274871826, "mean_norm/layer3": 11.644759356975555, "mean_norm/layer4": 10.301061511039734, "mean_norm/layer5": 12.979609191417694, "mean_norm/layer6": 9.761213302612305, "mean_norm/layer7": 10.34174370765686, "mean_norm/layer8": 10.878252863883972, "mean_norm/layer9": 10.798904299736023, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 11450 }, { "epoch": 4.78, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4699666995209761, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.6955602169036865, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6354, "eval_samples_per_second": 20.713, "eval_steps_per_second": 0.688, "step": 11450 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.8, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5003, "max_norm": 37.291603088378906, "max_norm/layer0": 28.814542770385742, "max_norm/layer1": 30.436798095703125, "max_norm/layer10": 31.88617706298828, "max_norm/layer11": 29.67328453063965, "max_norm/layer12": 33.657833099365234, "max_norm/layer13": 29.41160011291504, "max_norm/layer14": 30.73747444152832, "max_norm/layer15": 36.9760856628418, "max_norm/layer16": 30.654407501220703, "max_norm/layer17": 36.99338912963867, "max_norm/layer18": 32.32841110229492, "max_norm/layer19": 31.86827850341797, "max_norm/layer2": 23.515026092529297, "max_norm/layer20": 32.38021469116211, "max_norm/layer21": 32.233619689941406, "max_norm/layer22": 32.957420349121094, "max_norm/layer23": 31.38813018798828, "max_norm/layer3": 29.526674270629883, "max_norm/layer4": 29.14989471435547, "max_norm/layer5": 37.291603088378906, "max_norm/layer6": 24.593555450439453, "max_norm/layer7": 31.88994026184082, "max_norm/layer8": 31.295120239257812, "max_norm/layer9": 31.42879295349121, "mean_norm": 11.099412376681963, "mean_norm/layer0": 10.803522825241089, "mean_norm/layer1": 10.556218922138214, "mean_norm/layer10": 10.900573432445526, "mean_norm/layer11": 11.252809882164001, "mean_norm/layer12": 11.885180056095123, "mean_norm/layer13": 10.90925019979477, "mean_norm/layer14": 11.329178392887115, "mean_norm/layer15": 11.707133948802948, "mean_norm/layer16": 10.988328516483307, "mean_norm/layer17": 11.51287591457367, "mean_norm/layer18": 11.001640021800995, "mean_norm/layer19": 11.062367856502533, "mean_norm/layer2": 8.999559462070465, "mean_norm/layer20": 11.171233415603638, "mean_norm/layer21": 11.133346021175385, "mean_norm/layer22": 12.224068105220795, "mean_norm/layer23": 12.173038482666016, "mean_norm/layer3": 11.657609105110168, "mean_norm/layer4": 10.308907628059387, "mean_norm/layer5": 12.996685802936554, "mean_norm/layer6": 9.767203569412231, "mean_norm/layer7": 10.3494833111763, "mean_norm/layer8": 10.887590944766998, "mean_norm/layer9": 10.808091223239899, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 11500 }, { "epoch": 4.8, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4696584368649688, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.6966724395751953, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8337, "eval_samples_per_second": 20.366, "eval_steps_per_second": 0.676, "step": 11500 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.82, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5146, "max_norm": 37.38665008544922, "max_norm/layer0": 28.893375396728516, "max_norm/layer1": 30.520029067993164, "max_norm/layer10": 31.96396255493164, "max_norm/layer11": 29.7481632232666, "max_norm/layer12": 33.75273513793945, "max_norm/layer13": 29.522672653198242, "max_norm/layer14": 30.82471466064453, "max_norm/layer15": 37.11414337158203, "max_norm/layer16": 30.747474670410156, "max_norm/layer17": 37.13072204589844, "max_norm/layer18": 32.423282623291016, "max_norm/layer19": 31.967445373535156, "max_norm/layer2": 23.584957122802734, "max_norm/layer20": 32.46532440185547, "max_norm/layer21": 32.333984375, "max_norm/layer22": 33.03456497192383, "max_norm/layer23": 31.466445922851562, "max_norm/layer3": 29.594579696655273, "max_norm/layer4": 29.243301391601562, "max_norm/layer5": 37.38665008544922, "max_norm/layer6": 24.651927947998047, "max_norm/layer7": 31.993391036987305, "max_norm/layer8": 31.371482849121094, "max_norm/layer9": 31.511945724487305, "mean_norm": 11.10927926003933, "mean_norm/layer0": 10.81601083278656, "mean_norm/layer1": 10.565600395202637, "mean_norm/layer10": 10.909658670425415, "mean_norm/layer11": 11.262958586215973, "mean_norm/layer12": 11.898052752017975, "mean_norm/layer13": 10.91872924566269, "mean_norm/layer14": 11.339493930339813, "mean_norm/layer15": 11.718998372554779, "mean_norm/layer16": 10.997642517089844, "mean_norm/layer17": 11.523203492164612, "mean_norm/layer18": 11.01017940044403, "mean_norm/layer19": 11.071209847927094, "mean_norm/layer2": 9.003080189228058, "mean_norm/layer20": 11.179914832115173, "mean_norm/layer21": 11.142175793647766, "mean_norm/layer22": 12.23628032207489, "mean_norm/layer23": 12.185180723667145, "mean_norm/layer3": 11.6702880859375, "mean_norm/layer4": 10.316582083702087, "mean_norm/layer5": 13.013548851013184, "mean_norm/layer6": 9.772991418838501, "mean_norm/layer7": 10.357124924659729, "mean_norm/layer8": 10.896804749965668, "mean_norm/layer9": 10.816992223262787, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 11550 }, { "epoch": 4.82, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.47042098132982885, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.691270589828491, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6472, "eval_samples_per_second": 20.692, "eval_steps_per_second": 0.687, "step": 11550 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.84, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5026, "max_norm": 37.47762680053711, "max_norm/layer0": 28.971616744995117, "max_norm/layer1": 30.603607177734375, "max_norm/layer10": 32.050777435302734, "max_norm/layer11": 29.829021453857422, "max_norm/layer12": 33.8441162109375, "max_norm/layer13": 29.632450103759766, "max_norm/layer14": 30.915212631225586, "max_norm/layer15": 37.232913970947266, "max_norm/layer16": 30.840450286865234, "max_norm/layer17": 37.286354064941406, "max_norm/layer18": 32.52165985107422, "max_norm/layer19": 32.06243896484375, "max_norm/layer2": 23.63981819152832, "max_norm/layer20": 32.5574836730957, "max_norm/layer21": 32.43302536010742, "max_norm/layer22": 33.13492202758789, "max_norm/layer23": 31.543638229370117, "max_norm/layer3": 29.668012619018555, "max_norm/layer4": 29.327556610107422, "max_norm/layer5": 37.47762680053711, "max_norm/layer6": 24.719707489013672, "max_norm/layer7": 32.09111022949219, "max_norm/layer8": 31.45081901550293, "max_norm/layer9": 31.5856876373291, "mean_norm": 11.11912084867557, "mean_norm/layer0": 10.828483998775482, "mean_norm/layer1": 10.574886500835419, "mean_norm/layer10": 10.918683588504791, "mean_norm/layer11": 11.27305418252945, "mean_norm/layer12": 11.910798013210297, "mean_norm/layer13": 10.928040564060211, "mean_norm/layer14": 11.349718570709229, "mean_norm/layer15": 11.730824649333954, "mean_norm/layer16": 11.00691682100296, "mean_norm/layer17": 11.53353351354599, "mean_norm/layer18": 11.018724083900452, "mean_norm/layer19": 11.080044209957123, "mean_norm/layer2": 9.00660353899002, "mean_norm/layer20": 11.188700079917908, "mean_norm/layer21": 11.151018679141998, "mean_norm/layer22": 12.248418152332306, "mean_norm/layer23": 12.19741666316986, "mean_norm/layer3": 11.682981371879578, "mean_norm/layer4": 10.324283599853516, "mean_norm/layer5": 13.030375838279724, "mean_norm/layer6": 9.778766095638275, "mean_norm/layer7": 10.364711105823517, "mean_norm/layer8": 10.906016230583191, "mean_norm/layer9": 10.825900316238403, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 11600 }, { "epoch": 4.84, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.47171892935512266, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.687462568283081, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 10.8212, "eval_samples_per_second": 22.271, "eval_steps_per_second": 0.739, "step": 11600 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.86, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5085, "max_norm": 37.56265640258789, "max_norm/layer0": 29.0488224029541, "max_norm/layer1": 30.683454513549805, "max_norm/layer10": 32.14421844482422, "max_norm/layer11": 29.910310745239258, "max_norm/layer12": 33.934776306152344, "max_norm/layer13": 29.738357543945312, "max_norm/layer14": 30.991455078125, "max_norm/layer15": 37.36259841918945, "max_norm/layer16": 30.928890228271484, "max_norm/layer17": 37.42397689819336, "max_norm/layer18": 32.626399993896484, "max_norm/layer19": 32.142608642578125, "max_norm/layer2": 23.6883544921875, "max_norm/layer20": 32.648311614990234, "max_norm/layer21": 32.51786804199219, "max_norm/layer22": 33.245933532714844, "max_norm/layer23": 31.61872673034668, "max_norm/layer3": 29.742652893066406, "max_norm/layer4": 29.407451629638672, "max_norm/layer5": 37.56265640258789, "max_norm/layer6": 24.781131744384766, "max_norm/layer7": 32.19428253173828, "max_norm/layer8": 31.526046752929688, "max_norm/layer9": 31.649673461914062, "mean_norm": 11.12895734856526, "mean_norm/layer0": 10.840919971466064, "mean_norm/layer1": 10.584234595298767, "mean_norm/layer10": 10.927650392055511, "mean_norm/layer11": 11.283041536808014, "mean_norm/layer12": 11.923579931259155, "mean_norm/layer13": 10.937540829181671, "mean_norm/layer14": 11.360036492347717, "mean_norm/layer15": 11.742550194263458, "mean_norm/layer16": 11.016173362731934, "mean_norm/layer17": 11.543751299381256, "mean_norm/layer18": 11.027178168296814, "mean_norm/layer19": 11.088969767093658, "mean_norm/layer2": 9.010113298892975, "mean_norm/layer20": 11.197400689125061, "mean_norm/layer21": 11.159915804862976, "mean_norm/layer22": 12.260593712329865, "mean_norm/layer23": 12.209560513496399, "mean_norm/layer3": 11.695660948753357, "mean_norm/layer4": 10.331953763961792, "mean_norm/layer5": 13.04720538854599, "mean_norm/layer6": 9.784554660320282, "mean_norm/layer7": 10.37237673997879, "mean_norm/layer8": 10.91523164510727, "mean_norm/layer9": 10.834782660007477, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 11650 }, { "epoch": 4.86, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.47108617969279193, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.6874008178710938, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8478, "eval_samples_per_second": 20.341, "eval_steps_per_second": 0.675, "step": 11650 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.89, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5063, "max_norm": 37.657135009765625, "max_norm/layer0": 29.120641708374023, "max_norm/layer1": 30.76626205444336, "max_norm/layer10": 32.23412322998047, "max_norm/layer11": 29.978626251220703, "max_norm/layer12": 34.04027557373047, "max_norm/layer13": 29.84294891357422, "max_norm/layer14": 31.073169708251953, "max_norm/layer15": 37.47862243652344, "max_norm/layer16": 31.013898849487305, "max_norm/layer17": 37.55109786987305, "max_norm/layer18": 32.71333694458008, "max_norm/layer19": 32.22544860839844, "max_norm/layer2": 23.74456214904785, "max_norm/layer20": 32.7411003112793, "max_norm/layer21": 32.6014518737793, "max_norm/layer22": 33.357295989990234, "max_norm/layer23": 31.693147659301758, "max_norm/layer3": 29.81475257873535, "max_norm/layer4": 29.48421287536621, "max_norm/layer5": 37.657135009765625, "max_norm/layer6": 24.843406677246094, "max_norm/layer7": 32.288936614990234, "max_norm/layer8": 31.590938568115234, "max_norm/layer9": 31.715600967407227, "mean_norm": 11.138802573084831, "mean_norm/layer0": 10.853290915489197, "mean_norm/layer1": 10.593591392040253, "mean_norm/layer10": 10.93671852350235, "mean_norm/layer11": 11.29314911365509, "mean_norm/layer12": 11.936418116092682, "mean_norm/layer13": 10.9469895362854, "mean_norm/layer14": 11.370279312133789, "mean_norm/layer15": 11.754273056983948, "mean_norm/layer16": 11.025372207164764, "mean_norm/layer17": 11.554012775421143, "mean_norm/layer18": 11.035687029361725, "mean_norm/layer19": 11.097853183746338, "mean_norm/layer2": 9.013607859611511, "mean_norm/layer20": 11.206229448318481, "mean_norm/layer21": 11.168822050094604, "mean_norm/layer22": 12.272729098796844, "mean_norm/layer23": 12.221702218055725, "mean_norm/layer3": 11.708347916603088, "mean_norm/layer4": 10.339655816555023, "mean_norm/layer5": 13.06405371427536, "mean_norm/layer6": 9.790289580821991, "mean_norm/layer7": 10.380003929138184, "mean_norm/layer8": 10.924476206302643, "mean_norm/layer9": 10.843708753585815, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 11700 }, { "epoch": 4.89, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.47012488693655874, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.693180561065674, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8334, "eval_samples_per_second": 20.366, "eval_steps_per_second": 0.676, "step": 11700 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.91, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5059, "max_norm": 37.756587982177734, "max_norm/layer0": 29.19428253173828, "max_norm/layer1": 30.85544204711914, "max_norm/layer10": 32.325218200683594, "max_norm/layer11": 30.0484619140625, "max_norm/layer12": 34.143394470214844, "max_norm/layer13": 29.933761596679688, "max_norm/layer14": 31.147777557373047, "max_norm/layer15": 37.59746551513672, "max_norm/layer16": 31.10285758972168, "max_norm/layer17": 37.67106628417969, "max_norm/layer18": 32.811126708984375, "max_norm/layer19": 32.30681610107422, "max_norm/layer2": 23.80467987060547, "max_norm/layer20": 32.834537506103516, "max_norm/layer21": 32.69060516357422, "max_norm/layer22": 33.47240447998047, "max_norm/layer23": 31.775291442871094, "max_norm/layer3": 29.894990921020508, "max_norm/layer4": 29.559480667114258, "max_norm/layer5": 37.756587982177734, "max_norm/layer6": 24.900632858276367, "max_norm/layer7": 32.3841552734375, "max_norm/layer8": 31.64830780029297, "max_norm/layer9": 31.78627586364746, "mean_norm": 11.148543067276478, "mean_norm/layer0": 10.865490138530731, "mean_norm/layer1": 10.602823853492737, "mean_norm/layer10": 10.94576382637024, "mean_norm/layer11": 11.303158342838287, "mean_norm/layer12": 11.949087858200073, "mean_norm/layer13": 10.956337213516235, "mean_norm/layer14": 11.380485773086548, "mean_norm/layer15": 11.765974640846252, "mean_norm/layer16": 11.034591972827911, "mean_norm/layer17": 11.564175546169281, "mean_norm/layer18": 11.04419356584549, "mean_norm/layer19": 11.106570959091187, "mean_norm/layer2": 9.01699161529541, "mean_norm/layer20": 11.21491664648056, "mean_norm/layer21": 11.177606880664825, "mean_norm/layer22": 12.284631669521332, "mean_norm/layer23": 12.233553946018219, "mean_norm/layer3": 11.720988273620605, "mean_norm/layer4": 10.347264647483826, "mean_norm/layer5": 13.080726027488708, "mean_norm/layer6": 9.79598182439804, "mean_norm/layer7": 10.387580871582031, "mean_norm/layer8": 10.933634042739868, "mean_norm/layer9": 10.852503478527069, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 11750 }, { "epoch": 4.91, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46984501689360475, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.688762903213501, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6509, "eval_samples_per_second": 20.685, "eval_steps_per_second": 0.687, "step": 11750 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.93, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5079, "max_norm": 37.85048294067383, "max_norm/layer0": 29.263450622558594, "max_norm/layer1": 30.939136505126953, "max_norm/layer10": 32.416481018066406, "max_norm/layer11": 30.116899490356445, "max_norm/layer12": 34.24009323120117, "max_norm/layer13": 30.03861427307129, "max_norm/layer14": 31.231199264526367, "max_norm/layer15": 37.69263458251953, "max_norm/layer16": 31.176904678344727, "max_norm/layer17": 37.800819396972656, "max_norm/layer18": 32.89786911010742, "max_norm/layer19": 32.403892517089844, "max_norm/layer2": 23.873645782470703, "max_norm/layer20": 32.9393424987793, "max_norm/layer21": 32.77646255493164, "max_norm/layer22": 33.565677642822266, "max_norm/layer23": 31.855518341064453, "max_norm/layer3": 29.965782165527344, "max_norm/layer4": 29.643163681030273, "max_norm/layer5": 37.85048294067383, "max_norm/layer6": 24.967506408691406, "max_norm/layer7": 32.4691162109375, "max_norm/layer8": 31.7069034576416, "max_norm/layer9": 31.866910934448242, "mean_norm": 11.158328091104826, "mean_norm/layer0": 10.877790868282318, "mean_norm/layer1": 10.612155139446259, "mean_norm/layer10": 10.95480102300644, "mean_norm/layer11": 11.313199162483215, "mean_norm/layer12": 11.961796998977661, "mean_norm/layer13": 10.965710639953613, "mean_norm/layer14": 11.390668153762817, "mean_norm/layer15": 11.77765667438507, "mean_norm/layer16": 11.043775260448456, "mean_norm/layer17": 11.574420154094696, "mean_norm/layer18": 11.052655577659607, "mean_norm/layer19": 11.115290462970734, "mean_norm/layer2": 9.02040845155716, "mean_norm/layer20": 11.223563849925995, "mean_norm/layer21": 11.186604678630829, "mean_norm/layer22": 12.29665869474411, "mean_norm/layer23": 12.245661318302155, "mean_norm/layer3": 11.73361337184906, "mean_norm/layer4": 10.354853808879852, "mean_norm/layer5": 13.097476840019226, "mean_norm/layer6": 9.801718294620514, "mean_norm/layer7": 10.395187497138977, "mean_norm/layer8": 10.942837297916412, "mean_norm/layer9": 10.861369967460632, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 11800 }, { "epoch": 4.93, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4696624929525478, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.688814401626587, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8439, "eval_samples_per_second": 20.348, "eval_steps_per_second": 0.675, "step": 11800 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.95, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5014, "max_norm": 37.93788528442383, "max_norm/layer0": 29.340675354003906, "max_norm/layer1": 31.018381118774414, "max_norm/layer10": 32.511417388916016, "max_norm/layer11": 30.187868118286133, "max_norm/layer12": 34.35157775878906, "max_norm/layer13": 30.132198333740234, "max_norm/layer14": 31.31639289855957, "max_norm/layer15": 37.80784606933594, "max_norm/layer16": 31.25621795654297, "max_norm/layer17": 37.93748474121094, "max_norm/layer18": 32.988922119140625, "max_norm/layer19": 32.515724182128906, "max_norm/layer2": 23.931446075439453, "max_norm/layer20": 33.02553939819336, "max_norm/layer21": 32.86348342895508, "max_norm/layer22": 33.67148208618164, "max_norm/layer23": 31.935056686401367, "max_norm/layer3": 30.043079376220703, "max_norm/layer4": 29.730466842651367, "max_norm/layer5": 37.93788528442383, "max_norm/layer6": 25.02423667907715, "max_norm/layer7": 32.552818298339844, "max_norm/layer8": 31.76500701904297, "max_norm/layer9": 31.92847442626953, "mean_norm": 11.168228807548681, "mean_norm/layer0": 10.890288770198822, "mean_norm/layer1": 10.62157815694809, "mean_norm/layer10": 10.963908910751343, "mean_norm/layer11": 11.323238909244537, "mean_norm/layer12": 11.974679410457611, "mean_norm/layer13": 10.975349426269531, "mean_norm/layer14": 11.401008605957031, "mean_norm/layer15": 11.789547324180603, "mean_norm/layer16": 11.053157031536102, "mean_norm/layer17": 11.58478707075119, "mean_norm/layer18": 11.061248421669006, "mean_norm/layer19": 11.124230206012726, "mean_norm/layer2": 9.023894667625427, "mean_norm/layer20": 11.232537388801575, "mean_norm/layer21": 11.19556349515915, "mean_norm/layer22": 12.30886971950531, "mean_norm/layer23": 12.257866203784943, "mean_norm/layer3": 11.746358752250671, "mean_norm/layer4": 10.362483322620392, "mean_norm/layer5": 13.114296019077301, "mean_norm/layer6": 9.807480454444885, "mean_norm/layer7": 10.402803540229797, "mean_norm/layer8": 10.952084362506866, "mean_norm/layer9": 10.870231211185455, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 11850 }, { "epoch": 4.95, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4705872809205696, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.683215856552124, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6413, "eval_samples_per_second": 20.702, "eval_steps_per_second": 0.687, "step": 11850 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.97, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.519, "max_norm": 38.05906295776367, "max_norm/layer0": 29.42703628540039, "max_norm/layer1": 31.089515686035156, "max_norm/layer10": 32.583194732666016, "max_norm/layer11": 30.255687713623047, "max_norm/layer12": 34.46479797363281, "max_norm/layer13": 30.210359573364258, "max_norm/layer14": 31.400686264038086, "max_norm/layer15": 37.92513656616211, "max_norm/layer16": 31.335044860839844, "max_norm/layer17": 38.05906295776367, "max_norm/layer18": 33.082340240478516, "max_norm/layer19": 32.62194061279297, "max_norm/layer2": 24.000274658203125, "max_norm/layer20": 33.11968994140625, "max_norm/layer21": 32.96305847167969, "max_norm/layer22": 33.76947021484375, "max_norm/layer23": 32.0211181640625, "max_norm/layer3": 30.126047134399414, "max_norm/layer4": 29.8212947845459, "max_norm/layer5": 38.0276985168457, "max_norm/layer6": 25.084314346313477, "max_norm/layer7": 32.645408630371094, "max_norm/layer8": 31.83109474182129, "max_norm/layer9": 32.01667022705078, "mean_norm": 11.177929555376371, "mean_norm/layer0": 10.902526676654816, "mean_norm/layer1": 10.630789399147034, "mean_norm/layer10": 10.972841262817383, "mean_norm/layer11": 11.333194494247437, "mean_norm/layer12": 11.987314462661743, "mean_norm/layer13": 10.98465383052826, "mean_norm/layer14": 11.411219239234924, "mean_norm/layer15": 11.801235556602478, "mean_norm/layer16": 11.062246561050415, "mean_norm/layer17": 11.594827890396118, "mean_norm/layer18": 11.069670617580414, "mean_norm/layer19": 11.132874488830566, "mean_norm/layer2": 9.027332544326782, "mean_norm/layer20": 11.241263806819916, "mean_norm/layer21": 11.204251945018768, "mean_norm/layer22": 12.320836007595062, "mean_norm/layer23": 12.269861817359924, "mean_norm/layer3": 11.758853018283844, "mean_norm/layer4": 10.370031774044037, "mean_norm/layer5": 13.130874693393707, "mean_norm/layer6": 9.813177287578583, "mean_norm/layer7": 10.41031789779663, "mean_norm/layer8": 10.961123704910278, "mean_norm/layer9": 10.878990352153778, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 11900 }, { "epoch": 4.97, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4704128691546708, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.6838083267211914, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6596, "eval_samples_per_second": 20.67, "eval_steps_per_second": 0.686, "step": 11900 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 4.99, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.5041, "max_norm": 38.194522857666016, "max_norm/layer0": 29.501251220703125, "max_norm/layer1": 31.155527114868164, "max_norm/layer10": 32.66633224487305, "max_norm/layer11": 30.323793411254883, "max_norm/layer12": 34.57496643066406, "max_norm/layer13": 30.298030853271484, "max_norm/layer14": 31.500028610229492, "max_norm/layer15": 38.035335540771484, "max_norm/layer16": 31.41799545288086, "max_norm/layer17": 38.194522857666016, "max_norm/layer18": 33.178749084472656, "max_norm/layer19": 32.73746109008789, "max_norm/layer2": 24.063013076782227, "max_norm/layer20": 33.205509185791016, "max_norm/layer21": 33.06170654296875, "max_norm/layer22": 33.85256576538086, "max_norm/layer23": 32.10818862915039, "max_norm/layer3": 30.200939178466797, "max_norm/layer4": 29.90153694152832, "max_norm/layer5": 38.12092590332031, "max_norm/layer6": 25.150123596191406, "max_norm/layer7": 32.741180419921875, "max_norm/layer8": 31.89752197265625, "max_norm/layer9": 32.092933654785156, "mean_norm": 11.187665241460005, "mean_norm/layer0": 10.914686381816864, "mean_norm/layer1": 10.640029609203339, "mean_norm/layer10": 10.981725633144379, "mean_norm/layer11": 11.343181252479553, "mean_norm/layer12": 11.999892354011536, "mean_norm/layer13": 10.993940532207489, "mean_norm/layer14": 11.421403646469116, "mean_norm/layer15": 11.812836050987244, "mean_norm/layer16": 11.071481466293335, "mean_norm/layer17": 11.604974210262299, "mean_norm/layer18": 11.078194618225098, "mean_norm/layer19": 11.141615271568298, "mean_norm/layer2": 9.03076058626175, "mean_norm/layer20": 11.250074625015259, "mean_norm/layer21": 11.213150680065155, "mean_norm/layer22": 12.33284342288971, "mean_norm/layer23": 12.281926989555359, "mean_norm/layer3": 11.771265745162964, "mean_norm/layer4": 10.37760877609253, "mean_norm/layer5": 13.147468388080597, "mean_norm/layer6": 9.818911015987396, "mean_norm/layer7": 10.417860507965088, "mean_norm/layer8": 10.970265984535217, "mean_norm/layer9": 10.887868046760559, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 11950 }, { "epoch": 4.99, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4704534300304612, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.6852517127990723, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6451, "eval_samples_per_second": 20.695, "eval_steps_per_second": 0.687, "step": 11950 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.01, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.3794, "max_norm": 38.302860260009766, "max_norm/layer0": 29.574535369873047, "max_norm/layer1": 31.22898292541504, "max_norm/layer10": 32.7488899230957, "max_norm/layer11": 30.39142608642578, "max_norm/layer12": 34.67290496826172, "max_norm/layer13": 30.389312744140625, "max_norm/layer14": 31.585010528564453, "max_norm/layer15": 38.15389633178711, "max_norm/layer16": 31.482175827026367, "max_norm/layer17": 38.302860260009766, "max_norm/layer18": 33.27186965942383, "max_norm/layer19": 32.84207534790039, "max_norm/layer2": 24.129867553710938, "max_norm/layer20": 33.300254821777344, "max_norm/layer21": 33.150123596191406, "max_norm/layer22": 33.929691314697266, "max_norm/layer23": 32.196044921875, "max_norm/layer3": 30.272613525390625, "max_norm/layer4": 29.979124069213867, "max_norm/layer5": 38.213741302490234, "max_norm/layer6": 25.21087074279785, "max_norm/layer7": 32.830772399902344, "max_norm/layer8": 31.961711883544922, "max_norm/layer9": 32.1682243347168, "mean_norm": 11.19739151497682, "mean_norm/layer0": 10.926727831363678, "mean_norm/layer1": 10.64928013086319, "mean_norm/layer10": 10.990540206432343, "mean_norm/layer11": 11.35308039188385, "mean_norm/layer12": 12.012557685375214, "mean_norm/layer13": 11.003331005573273, "mean_norm/layer14": 11.4315704703331, "mean_norm/layer15": 11.824599802494049, "mean_norm/layer16": 11.080740988254547, "mean_norm/layer17": 11.61514014005661, "mean_norm/layer18": 11.086707293987274, "mean_norm/layer19": 11.150398910045624, "mean_norm/layer2": 9.034183740615845, "mean_norm/layer20": 11.259066879749298, "mean_norm/layer21": 11.222183465957642, "mean_norm/layer22": 12.344780445098877, "mean_norm/layer23": 12.294032156467438, "mean_norm/layer3": 11.783682465553284, "mean_norm/layer4": 10.38510811328888, "mean_norm/layer5": 13.16391259431839, "mean_norm/layer6": 9.824450016021729, "mean_norm/layer7": 10.425398409366608, "mean_norm/layer8": 10.979355573654175, "mean_norm/layer9": 10.896567642688751, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 12000 }, { "epoch": 5.01, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46842944232851874, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.722437858581543, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6518, "eval_samples_per_second": 20.684, "eval_steps_per_second": 0.687, "step": 12000 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.03, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.3033, "max_norm": 38.435333251953125, "max_norm/layer0": 29.649662017822266, "max_norm/layer1": 31.303651809692383, "max_norm/layer10": 32.83454895019531, "max_norm/layer11": 30.47419548034668, "max_norm/layer12": 34.7756462097168, "max_norm/layer13": 30.48672103881836, "max_norm/layer14": 31.663904190063477, "max_norm/layer15": 38.27345657348633, "max_norm/layer16": 31.572792053222656, "max_norm/layer17": 38.435333251953125, "max_norm/layer18": 33.37535095214844, "max_norm/layer19": 32.94023895263672, "max_norm/layer2": 24.199243545532227, "max_norm/layer20": 33.396766662597656, "max_norm/layer21": 33.266395568847656, "max_norm/layer22": 34.011863708496094, "max_norm/layer23": 32.28325653076172, "max_norm/layer3": 30.342016220092773, "max_norm/layer4": 30.060850143432617, "max_norm/layer5": 38.307411193847656, "max_norm/layer6": 25.27783203125, "max_norm/layer7": 32.91995620727539, "max_norm/layer8": 32.02895736694336, "max_norm/layer9": 32.24490737915039, "mean_norm": 11.207477805515131, "mean_norm/layer0": 10.939489781856537, "mean_norm/layer1": 10.658688187599182, "mean_norm/layer10": 10.99948763847351, "mean_norm/layer11": 11.363388180732727, "mean_norm/layer12": 12.025580883026123, "mean_norm/layer13": 11.013049066066742, "mean_norm/layer14": 11.442092716693878, "mean_norm/layer15": 11.836634337902069, "mean_norm/layer16": 11.090266406536102, "mean_norm/layer17": 11.625772356987, "mean_norm/layer18": 11.095670282840729, "mean_norm/layer19": 11.15985506772995, "mean_norm/layer2": 9.037715494632721, "mean_norm/layer20": 11.268753230571747, "mean_norm/layer21": 11.231657326221466, "mean_norm/layer22": 12.357149720191956, "mean_norm/layer23": 12.30664312839508, "mean_norm/layer3": 11.796434462070465, "mean_norm/layer4": 10.392972588539124, "mean_norm/layer5": 13.180622637271881, "mean_norm/layer6": 9.830242931842804, "mean_norm/layer7": 10.433066010475159, "mean_norm/layer8": 10.988660275936127, "mean_norm/layer9": 10.90557461977005, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 12050 }, { "epoch": 5.03, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46702197993859085, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7288458347320557, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.849, "eval_samples_per_second": 20.339, "eval_steps_per_second": 0.675, "step": 12050 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.05, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.3092, "max_norm": 38.57270812988281, "max_norm/layer0": 29.720144271850586, "max_norm/layer1": 31.386343002319336, "max_norm/layer10": 32.91311264038086, "max_norm/layer11": 30.554622650146484, "max_norm/layer12": 34.88260269165039, "max_norm/layer13": 30.58049774169922, "max_norm/layer14": 31.75419044494629, "max_norm/layer15": 38.385005950927734, "max_norm/layer16": 31.658222198486328, "max_norm/layer17": 38.57270812988281, "max_norm/layer18": 33.51114273071289, "max_norm/layer19": 33.040367126464844, "max_norm/layer2": 24.25741195678711, "max_norm/layer20": 33.488975524902344, "max_norm/layer21": 33.363487243652344, "max_norm/layer22": 34.08940505981445, "max_norm/layer23": 32.368831634521484, "max_norm/layer3": 30.41705894470215, "max_norm/layer4": 30.137144088745117, "max_norm/layer5": 38.41334533691406, "max_norm/layer6": 25.35138702392578, "max_norm/layer7": 33.001834869384766, "max_norm/layer8": 32.105072021484375, "max_norm/layer9": 32.34452438354492, "mean_norm": 11.21775616457065, "mean_norm/layer0": 10.952854812145233, "mean_norm/layer1": 10.668235659599304, "mean_norm/layer10": 11.008642077445984, "mean_norm/layer11": 11.373880326747894, "mean_norm/layer12": 12.038914799690247, "mean_norm/layer13": 11.02297329902649, "mean_norm/layer14": 11.452847063541412, "mean_norm/layer15": 11.848887979984283, "mean_norm/layer16": 11.099906980991364, "mean_norm/layer17": 11.636568486690521, "mean_norm/layer18": 11.10478299856186, "mean_norm/layer19": 11.169407188892365, "mean_norm/layer2": 9.04135924577713, "mean_norm/layer20": 11.278404533863068, "mean_norm/layer21": 11.241189360618591, "mean_norm/layer22": 12.369754791259766, "mean_norm/layer23": 12.31940084695816, "mean_norm/layer3": 11.80949753522873, "mean_norm/layer4": 10.400984764099121, "mean_norm/layer5": 13.19771432876587, "mean_norm/layer6": 9.83626252412796, "mean_norm/layer7": 10.44089788198471, "mean_norm/layer8": 10.998125731945038, "mean_norm/layer9": 10.914654731750488, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 12100 }, { "epoch": 5.05, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46599173369351393, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7484076023101807, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8461, "eval_samples_per_second": 20.344, "eval_steps_per_second": 0.675, "step": 12100 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.07, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.3214, "max_norm": 38.711116790771484, "max_norm/layer0": 29.78860092163086, "max_norm/layer1": 31.47394561767578, "max_norm/layer10": 33.007537841796875, "max_norm/layer11": 30.644929885864258, "max_norm/layer12": 34.98715591430664, "max_norm/layer13": 30.685518264770508, "max_norm/layer14": 31.84963035583496, "max_norm/layer15": 38.483680725097656, "max_norm/layer16": 31.737163543701172, "max_norm/layer17": 38.711116790771484, "max_norm/layer18": 33.6363639831543, "max_norm/layer19": 33.14191818237305, "max_norm/layer2": 24.332351684570312, "max_norm/layer20": 33.56949234008789, "max_norm/layer21": 33.465484619140625, "max_norm/layer22": 34.195106506347656, "max_norm/layer23": 32.45437240600586, "max_norm/layer3": 30.49375343322754, "max_norm/layer4": 30.231184005737305, "max_norm/layer5": 38.51918029785156, "max_norm/layer6": 25.419851303100586, "max_norm/layer7": 33.08552551269531, "max_norm/layer8": 32.17802810668945, "max_norm/layer9": 32.42779541015625, "mean_norm": 11.228026956319809, "mean_norm/layer0": 10.966456592082977, "mean_norm/layer1": 10.677858173847198, "mean_norm/layer10": 11.017882645130157, "mean_norm/layer11": 11.384362578392029, "mean_norm/layer12": 12.052213430404663, "mean_norm/layer13": 11.032799184322357, "mean_norm/layer14": 11.463645279407501, "mean_norm/layer15": 11.861131072044373, "mean_norm/layer16": 11.109526216983795, "mean_norm/layer17": 11.647267878055573, "mean_norm/layer18": 11.113752365112305, "mean_norm/layer19": 11.178877294063568, "mean_norm/layer2": 9.04505831003189, "mean_norm/layer20": 11.28793090581894, "mean_norm/layer21": 11.250765681266785, "mean_norm/layer22": 12.382255971431732, "mean_norm/layer23": 12.33215218782425, "mean_norm/layer3": 11.82255333662033, "mean_norm/layer4": 10.40901243686676, "mean_norm/layer5": 13.214745044708252, "mean_norm/layer6": 9.842304766178131, "mean_norm/layer7": 10.448727905750275, "mean_norm/layer8": 11.007568538188934, "mean_norm/layer9": 10.92379915714264, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 12150 }, { "epoch": 5.07, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4671112138653298, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7360055446624756, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6542, "eval_samples_per_second": 20.679, "eval_steps_per_second": 0.686, "step": 12150 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.09, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.3385, "max_norm": 38.83620834350586, "max_norm/layer0": 29.86420440673828, "max_norm/layer1": 31.559425354003906, "max_norm/layer10": 33.10588073730469, "max_norm/layer11": 30.738574981689453, "max_norm/layer12": 35.08659362792969, "max_norm/layer13": 30.78911781311035, "max_norm/layer14": 31.945295333862305, "max_norm/layer15": 38.5927848815918, "max_norm/layer16": 31.82872200012207, "max_norm/layer17": 38.83620834350586, "max_norm/layer18": 33.7295036315918, "max_norm/layer19": 33.2426643371582, "max_norm/layer2": 24.397293090820312, "max_norm/layer20": 33.64811706542969, "max_norm/layer21": 33.56774139404297, "max_norm/layer22": 34.284812927246094, "max_norm/layer23": 32.54706954956055, "max_norm/layer3": 30.576663970947266, "max_norm/layer4": 30.337905883789062, "max_norm/layer5": 38.61861038208008, "max_norm/layer6": 25.4854736328125, "max_norm/layer7": 33.1692008972168, "max_norm/layer8": 32.24501419067383, "max_norm/layer9": 32.51561737060547, "mean_norm": 11.23827119419972, "mean_norm/layer0": 10.980204999446869, "mean_norm/layer1": 10.687390863895416, "mean_norm/layer10": 11.027082443237305, "mean_norm/layer11": 11.394726574420929, "mean_norm/layer12": 12.06546550989151, "mean_norm/layer13": 11.042561769485474, "mean_norm/layer14": 11.474426746368408, "mean_norm/layer15": 11.873374342918396, "mean_norm/layer16": 11.119168400764465, "mean_norm/layer17": 11.657908141613007, "mean_norm/layer18": 11.122701942920685, "mean_norm/layer19": 11.188299894332886, "mean_norm/layer2": 9.04871541261673, "mean_norm/layer20": 11.297274112701416, "mean_norm/layer21": 11.260233700275421, "mean_norm/layer22": 12.394688069820404, "mean_norm/layer23": 12.344739496707916, "mean_norm/layer3": 11.835649728775024, "mean_norm/layer4": 10.417012393474579, "mean_norm/layer5": 13.231845915317535, "mean_norm/layer6": 9.848419427871704, "mean_norm/layer7": 10.456669807434082, "mean_norm/layer8": 11.017016351222992, "mean_norm/layer9": 10.932932615280151, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 12200 }, { "epoch": 5.09, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4663283889625745, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7343714237213135, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8312, "eval_samples_per_second": 20.37, "eval_steps_per_second": 0.676, "step": 12200 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.11, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.3454, "max_norm": 38.94695281982422, "max_norm/layer0": 29.94550895690918, "max_norm/layer1": 31.643796920776367, "max_norm/layer10": 33.20231246948242, "max_norm/layer11": 30.815670013427734, "max_norm/layer12": 35.189117431640625, "max_norm/layer13": 30.878437042236328, "max_norm/layer14": 32.03306198120117, "max_norm/layer15": 38.69236373901367, "max_norm/layer16": 31.911941528320312, "max_norm/layer17": 38.94695281982422, "max_norm/layer18": 33.80670928955078, "max_norm/layer19": 33.32986068725586, "max_norm/layer2": 24.444849014282227, "max_norm/layer20": 33.73457717895508, "max_norm/layer21": 33.681278228759766, "max_norm/layer22": 34.373939514160156, "max_norm/layer23": 32.62388229370117, "max_norm/layer3": 30.654300689697266, "max_norm/layer4": 30.43708038330078, "max_norm/layer5": 38.72135925292969, "max_norm/layer6": 25.56049156188965, "max_norm/layer7": 33.244224548339844, "max_norm/layer8": 32.313419342041016, "max_norm/layer9": 32.6116943359375, "mean_norm": 11.248527511954308, "mean_norm/layer0": 10.99410879611969, "mean_norm/layer1": 10.696984589099884, "mean_norm/layer10": 11.036336183547974, "mean_norm/layer11": 11.405112087726593, "mean_norm/layer12": 12.078685998916626, "mean_norm/layer13": 11.052375078201294, "mean_norm/layer14": 11.485212564468384, "mean_norm/layer15": 11.88576340675354, "mean_norm/layer16": 11.128781139850616, "mean_norm/layer17": 11.668495118618011, "mean_norm/layer18": 11.131764531135559, "mean_norm/layer19": 11.197697877883911, "mean_norm/layer2": 9.05235469341278, "mean_norm/layer20": 11.306506991386414, "mean_norm/layer21": 11.269656121730804, "mean_norm/layer22": 12.406981706619263, "mean_norm/layer23": 12.357316255569458, "mean_norm/layer3": 11.848814308643341, "mean_norm/layer4": 10.424997925758362, "mean_norm/layer5": 13.248937249183655, "mean_norm/layer6": 9.85450428724289, "mean_norm/layer7": 10.464615046977997, "mean_norm/layer8": 11.02652508020401, "mean_norm/layer9": 10.942133247852325, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 12250 }, { "epoch": 5.11, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4667056051074255, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.738703489303589, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8467, "eval_samples_per_second": 20.343, "eval_steps_per_second": 0.675, "step": 12250 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.14, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.3659, "max_norm": 39.07551956176758, "max_norm/layer0": 30.023889541625977, "max_norm/layer1": 31.72894287109375, "max_norm/layer10": 33.298709869384766, "max_norm/layer11": 30.895883560180664, "max_norm/layer12": 35.28593444824219, "max_norm/layer13": 30.964996337890625, "max_norm/layer14": 32.12107849121094, "max_norm/layer15": 38.7972412109375, "max_norm/layer16": 32.01172637939453, "max_norm/layer17": 39.07551956176758, "max_norm/layer18": 33.89895248413086, "max_norm/layer19": 33.43098449707031, "max_norm/layer2": 24.488872528076172, "max_norm/layer20": 33.816402435302734, "max_norm/layer21": 33.77363586425781, "max_norm/layer22": 34.466548919677734, "max_norm/layer23": 32.704017639160156, "max_norm/layer3": 30.721336364746094, "max_norm/layer4": 30.511106491088867, "max_norm/layer5": 38.81980895996094, "max_norm/layer6": 25.633987426757812, "max_norm/layer7": 33.3271598815918, "max_norm/layer8": 32.375736236572266, "max_norm/layer9": 32.68894958496094, "mean_norm": 11.258795611560345, "mean_norm/layer0": 11.00811630487442, "mean_norm/layer1": 10.706629991531372, "mean_norm/layer10": 11.045571565628052, "mean_norm/layer11": 11.415521442890167, "mean_norm/layer12": 12.091852962970734, "mean_norm/layer13": 11.062187731266022, "mean_norm/layer14": 11.495945274829865, "mean_norm/layer15": 11.898083865642548, "mean_norm/layer16": 11.138496458530426, "mean_norm/layer17": 11.679109454154968, "mean_norm/layer18": 11.14063447713852, "mean_norm/layer19": 11.207036793231964, "mean_norm/layer2": 9.056014776229858, "mean_norm/layer20": 11.315796852111816, "mean_norm/layer21": 11.279004096984863, "mean_norm/layer22": 12.419390439987183, "mean_norm/layer23": 12.369924485683441, "mean_norm/layer3": 11.862018048763275, "mean_norm/layer4": 10.433027982711792, "mean_norm/layer5": 13.266180872917175, "mean_norm/layer6": 9.860602617263794, "mean_norm/layer7": 10.472546875476837, "mean_norm/layer8": 11.036045849323273, "mean_norm/layer9": 10.951355457305908, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 12300 }, { "epoch": 5.14, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46643790332720864, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.738595724105835, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8552, "eval_samples_per_second": 20.329, "eval_steps_per_second": 0.675, "step": 12300 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.16, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.3723, "max_norm": 39.21499252319336, "max_norm/layer0": 30.096342086791992, "max_norm/layer1": 31.81536293029785, "max_norm/layer10": 33.39365005493164, "max_norm/layer11": 30.970529556274414, "max_norm/layer12": 35.38508605957031, "max_norm/layer13": 31.051616668701172, "max_norm/layer14": 32.2015266418457, "max_norm/layer15": 38.904335021972656, "max_norm/layer16": 32.10439682006836, "max_norm/layer17": 39.21499252319336, "max_norm/layer18": 33.9943733215332, "max_norm/layer19": 33.54290771484375, "max_norm/layer2": 24.53144645690918, "max_norm/layer20": 33.91130065917969, "max_norm/layer21": 33.88111114501953, "max_norm/layer22": 34.56108093261719, "max_norm/layer23": 32.789222717285156, "max_norm/layer3": 30.79220962524414, "max_norm/layer4": 30.591642379760742, "max_norm/layer5": 38.921443939208984, "max_norm/layer6": 25.69824981689453, "max_norm/layer7": 33.40739440917969, "max_norm/layer8": 32.45912551879883, "max_norm/layer9": 32.77835464477539, "mean_norm": 11.269128928581873, "mean_norm/layer0": 11.022284209728241, "mean_norm/layer1": 10.716285347938538, "mean_norm/layer10": 11.054743885993958, "mean_norm/layer11": 11.426034033298492, "mean_norm/layer12": 12.105147123336792, "mean_norm/layer13": 11.072054088115692, "mean_norm/layer14": 11.506755590438843, "mean_norm/layer15": 11.91039365530014, "mean_norm/layer16": 11.14819085597992, "mean_norm/layer17": 11.689731240272522, "mean_norm/layer18": 11.149564683437347, "mean_norm/layer19": 11.216427028179169, "mean_norm/layer2": 9.059784173965454, "mean_norm/layer20": 11.325107753276825, "mean_norm/layer21": 11.28848946094513, "mean_norm/layer22": 12.431827366352081, "mean_norm/layer23": 12.38248485326767, "mean_norm/layer3": 11.875406265258789, "mean_norm/layer4": 10.441197097301483, "mean_norm/layer5": 13.283584535121918, "mean_norm/layer6": 9.866783261299133, "mean_norm/layer7": 10.480609238147736, "mean_norm/layer8": 11.04563707113266, "mean_norm/layer9": 10.960571467876434, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 12350 }, { "epoch": 5.16, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46718422344175253, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7359020709991455, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8471, "eval_samples_per_second": 20.342, "eval_steps_per_second": 0.675, "step": 12350 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.18, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.3804, "max_norm": 39.340614318847656, "max_norm/layer0": 30.16893196105957, "max_norm/layer1": 31.899879455566406, "max_norm/layer10": 33.48374557495117, "max_norm/layer11": 31.040555953979492, "max_norm/layer12": 35.49278259277344, "max_norm/layer13": 31.146411895751953, "max_norm/layer14": 32.291934967041016, "max_norm/layer15": 39.00080108642578, "max_norm/layer16": 32.20722198486328, "max_norm/layer17": 39.340614318847656, "max_norm/layer18": 34.10038757324219, "max_norm/layer19": 33.632362365722656, "max_norm/layer2": 24.594600677490234, "max_norm/layer20": 33.99564743041992, "max_norm/layer21": 33.98853302001953, "max_norm/layer22": 34.644447326660156, "max_norm/layer23": 32.86933135986328, "max_norm/layer3": 30.86780548095703, "max_norm/layer4": 30.658416748046875, "max_norm/layer5": 39.01528549194336, "max_norm/layer6": 25.761075973510742, "max_norm/layer7": 33.47981643676758, "max_norm/layer8": 32.54744338989258, "max_norm/layer9": 32.88261413574219, "mean_norm": 11.279446867605051, "mean_norm/layer0": 11.036405384540558, "mean_norm/layer1": 10.72603064775467, "mean_norm/layer10": 11.063933193683624, "mean_norm/layer11": 11.436520993709564, "mean_norm/layer12": 12.118435442447662, "mean_norm/layer13": 11.082020878791809, "mean_norm/layer14": 11.517515301704407, "mean_norm/layer15": 11.922657191753387, "mean_norm/layer16": 11.157944202423096, "mean_norm/layer17": 11.700325787067413, "mean_norm/layer18": 11.158488869667053, "mean_norm/layer19": 11.225876986980438, "mean_norm/layer2": 9.06354033946991, "mean_norm/layer20": 11.334345400333405, "mean_norm/layer21": 11.297895312309265, "mean_norm/layer22": 12.444255292415619, "mean_norm/layer23": 12.39496910572052, "mean_norm/layer3": 11.888732671737671, "mean_norm/layer4": 10.449354648590088, "mean_norm/layer5": 13.300997972488403, "mean_norm/layer6": 9.872974157333374, "mean_norm/layer7": 10.488583147525787, "mean_norm/layer8": 11.055160284042358, "mean_norm/layer9": 10.969761610031128, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 12400 }, { "epoch": 5.18, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46694897036216804, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7420947551727295, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8371, "eval_samples_per_second": 20.36, "eval_steps_per_second": 0.676, "step": 12400 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.2, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.374, "max_norm": 39.4640998840332, "max_norm/layer0": 30.24111557006836, "max_norm/layer1": 31.98891830444336, "max_norm/layer10": 33.58835983276367, "max_norm/layer11": 31.11510467529297, "max_norm/layer12": 35.58452224731445, "max_norm/layer13": 31.24594497680664, "max_norm/layer14": 32.39015579223633, "max_norm/layer15": 39.09994888305664, "max_norm/layer16": 32.305450439453125, "max_norm/layer17": 39.4640998840332, "max_norm/layer18": 34.1920166015625, "max_norm/layer19": 33.718265533447266, "max_norm/layer2": 24.64690589904785, "max_norm/layer20": 34.07452392578125, "max_norm/layer21": 34.084495544433594, "max_norm/layer22": 34.735374450683594, "max_norm/layer23": 32.95333480834961, "max_norm/layer3": 30.938343048095703, "max_norm/layer4": 30.739850997924805, "max_norm/layer5": 39.114383697509766, "max_norm/layer6": 25.823427200317383, "max_norm/layer7": 33.55558395385742, "max_norm/layer8": 32.629051208496094, "max_norm/layer9": 32.965084075927734, "mean_norm": 11.289606223503748, "mean_norm/layer0": 11.050397753715515, "mean_norm/layer1": 10.735670387744904, "mean_norm/layer10": 11.073055744171143, "mean_norm/layer11": 11.446790933609009, "mean_norm/layer12": 12.131577014923096, "mean_norm/layer13": 11.091777503490448, "mean_norm/layer14": 11.528154075145721, "mean_norm/layer15": 11.934624075889587, "mean_norm/layer16": 11.167495727539062, "mean_norm/layer17": 11.710758984088898, "mean_norm/layer18": 11.16724556684494, "mean_norm/layer19": 11.23505425453186, "mean_norm/layer2": 9.067234516143799, "mean_norm/layer20": 11.343270659446716, "mean_norm/layer21": 11.307054281234741, "mean_norm/layer22": 12.456541776657104, "mean_norm/layer23": 12.407329261302948, "mean_norm/layer3": 11.901857256889343, "mean_norm/layer4": 10.45742917060852, "mean_norm/layer5": 13.318169116973877, "mean_norm/layer6": 9.879100859165192, "mean_norm/layer7": 10.496457755565643, "mean_norm/layer8": 11.064581274986267, "mean_norm/layer9": 10.97892141342163, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 12450 }, { "epoch": 5.2, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46639734245141823, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.733039379119873, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8446, "eval_samples_per_second": 20.347, "eval_steps_per_second": 0.675, "step": 12450 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.22, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.3609, "max_norm": 39.59554672241211, "max_norm/layer0": 30.308876037597656, "max_norm/layer1": 32.06950378417969, "max_norm/layer10": 33.700904846191406, "max_norm/layer11": 31.186481475830078, "max_norm/layer12": 35.678646087646484, "max_norm/layer13": 31.349061965942383, "max_norm/layer14": 32.47747039794922, "max_norm/layer15": 39.23009490966797, "max_norm/layer16": 32.39930725097656, "max_norm/layer17": 39.59554672241211, "max_norm/layer18": 34.284759521484375, "max_norm/layer19": 33.8138313293457, "max_norm/layer2": 24.689485549926758, "max_norm/layer20": 34.164310455322266, "max_norm/layer21": 34.197967529296875, "max_norm/layer22": 34.82883834838867, "max_norm/layer23": 33.03238296508789, "max_norm/layer3": 31.01808738708496, "max_norm/layer4": 30.82036590576172, "max_norm/layer5": 39.21382522583008, "max_norm/layer6": 25.887048721313477, "max_norm/layer7": 33.6284065246582, "max_norm/layer8": 32.720245361328125, "max_norm/layer9": 33.05253601074219, "mean_norm": 11.29996439566215, "mean_norm/layer0": 11.064708232879639, "mean_norm/layer1": 10.745510697364807, "mean_norm/layer10": 11.082452714443207, "mean_norm/layer11": 11.457266986370087, "mean_norm/layer12": 12.14503288269043, "mean_norm/layer13": 11.101730048656464, "mean_norm/layer14": 11.539036452770233, "mean_norm/layer15": 11.946848630905151, "mean_norm/layer16": 11.177112400531769, "mean_norm/layer17": 11.721317291259766, "mean_norm/layer18": 11.176118850708008, "mean_norm/layer19": 11.24438202381134, "mean_norm/layer2": 9.071042716503143, "mean_norm/layer20": 11.352453172206879, "mean_norm/layer21": 11.316423892974854, "mean_norm/layer22": 12.468946397304535, "mean_norm/layer23": 12.419977307319641, "mean_norm/layer3": 11.915303409099579, "mean_norm/layer4": 10.465545892715454, "mean_norm/layer5": 13.335692644119263, "mean_norm/layer6": 9.885368764400482, "mean_norm/layer7": 10.50448876619339, "mean_norm/layer8": 11.074171483516693, "mean_norm/layer9": 10.988213837146759, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 12500 }, { "epoch": 5.22, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46689218513606145, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7314534187316895, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.652, "eval_samples_per_second": 20.683, "eval_steps_per_second": 0.687, "step": 12500 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.24, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.3862, "max_norm": 39.70277404785156, "max_norm/layer0": 30.38404083251953, "max_norm/layer1": 32.14478302001953, "max_norm/layer10": 33.805885314941406, "max_norm/layer11": 31.260480880737305, "max_norm/layer12": 35.794734954833984, "max_norm/layer13": 31.43575096130371, "max_norm/layer14": 32.58359909057617, "max_norm/layer15": 39.35628128051758, "max_norm/layer16": 32.494712829589844, "max_norm/layer17": 39.70277404785156, "max_norm/layer18": 34.3810920715332, "max_norm/layer19": 33.91523361206055, "max_norm/layer2": 24.739246368408203, "max_norm/layer20": 34.25129699707031, "max_norm/layer21": 34.31393051147461, "max_norm/layer22": 34.92304611206055, "max_norm/layer23": 33.12150573730469, "max_norm/layer3": 31.105815887451172, "max_norm/layer4": 30.906110763549805, "max_norm/layer5": 39.31342697143555, "max_norm/layer6": 25.954769134521484, "max_norm/layer7": 33.6923713684082, "max_norm/layer8": 32.806705474853516, "max_norm/layer9": 33.13435745239258, "mean_norm": 11.310173459351063, "mean_norm/layer0": 11.078775227069855, "mean_norm/layer1": 10.755265414714813, "mean_norm/layer10": 11.091667652130127, "mean_norm/layer11": 11.467542886734009, "mean_norm/layer12": 12.158098638057709, "mean_norm/layer13": 11.111486971378326, "mean_norm/layer14": 11.549628913402557, "mean_norm/layer15": 11.958956837654114, "mean_norm/layer16": 11.186640977859497, "mean_norm/layer17": 11.731778621673584, "mean_norm/layer18": 11.184843063354492, "mean_norm/layer19": 11.253638625144958, "mean_norm/layer2": 9.074791491031647, "mean_norm/layer20": 11.361482739448547, "mean_norm/layer21": 11.32561457157135, "mean_norm/layer22": 12.481294214725494, "mean_norm/layer23": 12.432406663894653, "mean_norm/layer3": 11.928609669208527, "mean_norm/layer4": 10.473615765571594, "mean_norm/layer5": 13.353126347064972, "mean_norm/layer6": 9.891473472118378, "mean_norm/layer7": 10.512412011623383, "mean_norm/layer8": 11.083585619926453, "mean_norm/layer9": 10.997426629066467, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 12550 }, { "epoch": 5.24, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46764661742576347, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.731708288192749, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8512, "eval_samples_per_second": 20.335, "eval_steps_per_second": 0.675, "step": 12550 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.26, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.3884, "max_norm": 39.81848907470703, "max_norm/layer0": 30.465442657470703, "max_norm/layer1": 32.21744155883789, "max_norm/layer10": 33.90283203125, "max_norm/layer11": 31.341875076293945, "max_norm/layer12": 35.89216995239258, "max_norm/layer13": 31.522750854492188, "max_norm/layer14": 32.66755676269531, "max_norm/layer15": 39.477203369140625, "max_norm/layer16": 32.581642150878906, "max_norm/layer17": 39.81848907470703, "max_norm/layer18": 34.4770393371582, "max_norm/layer19": 34.00304412841797, "max_norm/layer2": 24.784198760986328, "max_norm/layer20": 34.34490966796875, "max_norm/layer21": 34.41489791870117, "max_norm/layer22": 35.03091812133789, "max_norm/layer23": 33.20782470703125, "max_norm/layer3": 31.18351173400879, "max_norm/layer4": 30.99317169189453, "max_norm/layer5": 39.4189567565918, "max_norm/layer6": 26.01103401184082, "max_norm/layer7": 33.767051696777344, "max_norm/layer8": 32.885719299316406, "max_norm/layer9": 33.21125793457031, "mean_norm": 11.320386427144209, "mean_norm/layer0": 11.092981338500977, "mean_norm/layer1": 10.765110731124878, "mean_norm/layer10": 11.1008420586586, "mean_norm/layer11": 11.477921664714813, "mean_norm/layer12": 12.171100318431854, "mean_norm/layer13": 11.121250987052917, "mean_norm/layer14": 11.560356736183167, "mean_norm/layer15": 11.971032798290253, "mean_norm/layer16": 11.196124851703644, "mean_norm/layer17": 11.742257952690125, "mean_norm/layer18": 11.193524301052094, "mean_norm/layer19": 11.262769341468811, "mean_norm/layer2": 9.07853776216507, "mean_norm/layer20": 11.370389938354492, "mean_norm/layer21": 11.334768116474152, "mean_norm/layer22": 12.493632674217224, "mean_norm/layer23": 12.444727778434753, "mean_norm/layer3": 11.94198340177536, "mean_norm/layer4": 10.481647431850433, "mean_norm/layer5": 13.370624423027039, "mean_norm/layer6": 9.897690117359161, "mean_norm/layer7": 10.52032458782196, "mean_norm/layer8": 11.093088150024414, "mean_norm/layer9": 11.006586790084839, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 12600 }, { "epoch": 5.26, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4682955914384103, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7252254486083984, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8473, "eval_samples_per_second": 20.342, "eval_steps_per_second": 0.675, "step": 12600 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.28, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4032, "max_norm": 39.929420471191406, "max_norm/layer0": 30.548931121826172, "max_norm/layer1": 32.29167175292969, "max_norm/layer10": 34.00247573852539, "max_norm/layer11": 31.41254997253418, "max_norm/layer12": 35.99769973754883, "max_norm/layer13": 31.61075210571289, "max_norm/layer14": 32.75844192504883, "max_norm/layer15": 39.58732986450195, "max_norm/layer16": 32.66705322265625, "max_norm/layer17": 39.929420471191406, "max_norm/layer18": 34.565277099609375, "max_norm/layer19": 34.10858917236328, "max_norm/layer2": 24.823476791381836, "max_norm/layer20": 34.442203521728516, "max_norm/layer21": 34.50871658325195, "max_norm/layer22": 35.11521530151367, "max_norm/layer23": 33.29035186767578, "max_norm/layer3": 31.250028610229492, "max_norm/layer4": 31.078842163085938, "max_norm/layer5": 39.521339416503906, "max_norm/layer6": 26.063798904418945, "max_norm/layer7": 33.84354782104492, "max_norm/layer8": 32.952308654785156, "max_norm/layer9": 33.28911209106445, "mean_norm": 11.33057057360808, "mean_norm/layer0": 11.107169270515442, "mean_norm/layer1": 10.774906635284424, "mean_norm/layer10": 11.110038161277771, "mean_norm/layer11": 11.488389551639557, "mean_norm/layer12": 12.184193432331085, "mean_norm/layer13": 11.13099753856659, "mean_norm/layer14": 11.571000754833221, "mean_norm/layer15": 11.983158111572266, "mean_norm/layer16": 11.205597698688507, "mean_norm/layer17": 11.75269091129303, "mean_norm/layer18": 11.20217877626419, "mean_norm/layer19": 11.271834790706635, "mean_norm/layer2": 9.082184433937073, "mean_norm/layer20": 11.379377901554108, "mean_norm/layer21": 11.343716561794281, "mean_norm/layer22": 12.505850672721863, "mean_norm/layer23": 12.457082509994507, "mean_norm/layer3": 11.95522665977478, "mean_norm/layer4": 10.489646911621094, "mean_norm/layer5": 13.388073563575745, "mean_norm/layer6": 9.903882265090942, "mean_norm/layer7": 10.528180718421936, "mean_norm/layer8": 11.102473735809326, "mean_norm/layer9": 11.015842199325562, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 12650 }, { "epoch": 5.28, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46865252714536615, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7251226902008057, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8478, "eval_samples_per_second": 20.341, "eval_steps_per_second": 0.675, "step": 12650 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.3, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.3873, "max_norm": 40.05979919433594, "max_norm/layer0": 30.627132415771484, "max_norm/layer1": 32.355186462402344, "max_norm/layer10": 34.118804931640625, "max_norm/layer11": 31.481056213378906, "max_norm/layer12": 36.096923828125, "max_norm/layer13": 31.706356048583984, "max_norm/layer14": 32.84482192993164, "max_norm/layer15": 39.70392608642578, "max_norm/layer16": 32.7635498046875, "max_norm/layer17": 40.05979919433594, "max_norm/layer18": 34.661746978759766, "max_norm/layer19": 34.22161102294922, "max_norm/layer2": 24.860652923583984, "max_norm/layer20": 34.532554626464844, "max_norm/layer21": 34.61908721923828, "max_norm/layer22": 35.19852066040039, "max_norm/layer23": 33.36899185180664, "max_norm/layer3": 31.320377349853516, "max_norm/layer4": 31.162757873535156, "max_norm/layer5": 39.61590576171875, "max_norm/layer6": 26.116485595703125, "max_norm/layer7": 33.92621994018555, "max_norm/layer8": 33.02066421508789, "max_norm/layer9": 33.36391830444336, "mean_norm": 11.340739885965982, "mean_norm/layer0": 11.121292233467102, "mean_norm/layer1": 10.784716546535492, "mean_norm/layer10": 11.11919617652893, "mean_norm/layer11": 11.498693943023682, "mean_norm/layer12": 12.19723129272461, "mean_norm/layer13": 11.140634655952454, "mean_norm/layer14": 11.581675231456757, "mean_norm/layer15": 11.995171904563904, "mean_norm/layer16": 11.215030312538147, "mean_norm/layer17": 11.763100147247314, "mean_norm/layer18": 11.210864186286926, "mean_norm/layer19": 11.28091686964035, "mean_norm/layer2": 9.08584862947464, "mean_norm/layer20": 11.38850075006485, "mean_norm/layer21": 11.352761268615723, "mean_norm/layer22": 12.517931997776031, "mean_norm/layer23": 12.469390869140625, "mean_norm/layer3": 11.968517303466797, "mean_norm/layer4": 10.497656643390656, "mean_norm/layer5": 13.405577003955841, "mean_norm/layer6": 9.910086631774902, "mean_norm/layer7": 10.536053538322449, "mean_norm/layer8": 11.111887276172638, "mean_norm/layer9": 11.025021851062775, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 12700 }, { "epoch": 5.3, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4685105640800996, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7220449447631836, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8546, "eval_samples_per_second": 20.33, "eval_steps_per_second": 0.675, "step": 12700 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.32, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.3962, "max_norm": 40.18087387084961, "max_norm/layer0": 30.704357147216797, "max_norm/layer1": 32.41680145263672, "max_norm/layer10": 34.22196578979492, "max_norm/layer11": 31.54886245727539, "max_norm/layer12": 36.20389175415039, "max_norm/layer13": 31.789897918701172, "max_norm/layer14": 32.93586349487305, "max_norm/layer15": 39.839820861816406, "max_norm/layer16": 32.85014343261719, "max_norm/layer17": 40.18087387084961, "max_norm/layer18": 34.7507209777832, "max_norm/layer19": 34.320194244384766, "max_norm/layer2": 24.904115676879883, "max_norm/layer20": 34.61308670043945, "max_norm/layer21": 34.72566223144531, "max_norm/layer22": 35.28715896606445, "max_norm/layer23": 33.438289642333984, "max_norm/layer3": 31.39183235168457, "max_norm/layer4": 31.243642807006836, "max_norm/layer5": 39.70951461791992, "max_norm/layer6": 26.163026809692383, "max_norm/layer7": 34.013248443603516, "max_norm/layer8": 33.09016036987305, "max_norm/layer9": 33.44902801513672, "mean_norm": 11.350986532866955, "mean_norm/layer0": 11.135516226291656, "mean_norm/layer1": 10.794594943523407, "mean_norm/layer10": 11.12837165594101, "mean_norm/layer11": 11.509005963802338, "mean_norm/layer12": 12.210427522659302, "mean_norm/layer13": 11.150359153747559, "mean_norm/layer14": 11.592359781265259, "mean_norm/layer15": 12.007216930389404, "mean_norm/layer16": 11.22458028793335, "mean_norm/layer17": 11.773609936237335, "mean_norm/layer18": 11.219653248786926, "mean_norm/layer19": 11.29003256559372, "mean_norm/layer2": 9.089622676372528, "mean_norm/layer20": 11.397597908973694, "mean_norm/layer21": 11.361972987651825, "mean_norm/layer22": 12.5301353931427, "mean_norm/layer23": 12.481706082820892, "mean_norm/layer3": 11.98196655511856, "mean_norm/layer4": 10.505818009376526, "mean_norm/layer5": 13.423184752464294, "mean_norm/layer6": 9.916291773319244, "mean_norm/layer7": 10.543961584568024, "mean_norm/layer8": 11.121361255645752, "mean_norm/layer9": 11.03432959318161, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 12750 }, { "epoch": 5.32, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4678575339798737, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.725661516189575, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6564, "eval_samples_per_second": 20.675, "eval_steps_per_second": 0.686, "step": 12750 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.34, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4083, "max_norm": 40.30177307128906, "max_norm/layer0": 30.785463333129883, "max_norm/layer1": 32.49075698852539, "max_norm/layer10": 34.32855987548828, "max_norm/layer11": 31.61981773376465, "max_norm/layer12": 36.33092498779297, "max_norm/layer13": 31.879899978637695, "max_norm/layer14": 33.02179718017578, "max_norm/layer15": 39.950584411621094, "max_norm/layer16": 32.93088150024414, "max_norm/layer17": 40.30177307128906, "max_norm/layer18": 34.84276580810547, "max_norm/layer19": 34.421875, "max_norm/layer2": 24.946029663085938, "max_norm/layer20": 34.69622802734375, "max_norm/layer21": 34.828857421875, "max_norm/layer22": 35.38137435913086, "max_norm/layer23": 33.52065658569336, "max_norm/layer3": 31.4727783203125, "max_norm/layer4": 31.318620681762695, "max_norm/layer5": 39.80884552001953, "max_norm/layer6": 26.22019386291504, "max_norm/layer7": 34.104026794433594, "max_norm/layer8": 33.16169738769531, "max_norm/layer9": 33.532066345214844, "mean_norm": 11.361123723288378, "mean_norm/layer0": 11.1495241522789, "mean_norm/layer1": 10.804406702518463, "mean_norm/layer10": 11.137525200843811, "mean_norm/layer11": 11.519233465194702, "mean_norm/layer12": 12.2235426902771, "mean_norm/layer13": 11.16000908613205, "mean_norm/layer14": 11.602903127670288, "mean_norm/layer15": 12.019250571727753, "mean_norm/layer16": 11.234025776386261, "mean_norm/layer17": 11.783994853496552, "mean_norm/layer18": 11.228349685668945, "mean_norm/layer19": 11.299010992050171, "mean_norm/layer2": 9.093325853347778, "mean_norm/layer20": 11.406367242336273, "mean_norm/layer21": 11.370973885059357, "mean_norm/layer22": 12.54227989912033, "mean_norm/layer23": 12.49396014213562, "mean_norm/layer3": 11.995252788066864, "mean_norm/layer4": 10.513902842998505, "mean_norm/layer5": 13.440637111663818, "mean_norm/layer6": 9.922372043132782, "mean_norm/layer7": 10.55189323425293, "mean_norm/layer8": 11.13077861070633, "mean_norm/layer9": 11.043449401855469, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 12800 }, { "epoch": 5.34, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4677601878779767, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7198004722595215, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6292, "eval_samples_per_second": 20.724, "eval_steps_per_second": 0.688, "step": 12800 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.37, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.3925, "max_norm": 40.42647933959961, "max_norm/layer0": 30.862247467041016, "max_norm/layer1": 32.58104705810547, "max_norm/layer10": 34.42935562133789, "max_norm/layer11": 31.688074111938477, "max_norm/layer12": 36.43111038208008, "max_norm/layer13": 31.962995529174805, "max_norm/layer14": 33.105018615722656, "max_norm/layer15": 40.07574462890625, "max_norm/layer16": 33.029239654541016, "max_norm/layer17": 40.42647933959961, "max_norm/layer18": 34.93319320678711, "max_norm/layer19": 34.51870346069336, "max_norm/layer2": 24.97833824157715, "max_norm/layer20": 34.78074645996094, "max_norm/layer21": 34.91769790649414, "max_norm/layer22": 35.466556549072266, "max_norm/layer23": 33.60380935668945, "max_norm/layer3": 31.545141220092773, "max_norm/layer4": 31.3936710357666, "max_norm/layer5": 39.9000129699707, "max_norm/layer6": 26.277626037597656, "max_norm/layer7": 34.1938591003418, "max_norm/layer8": 33.24137878417969, "max_norm/layer9": 33.62035369873047, "mean_norm": 11.371210957566896, "mean_norm/layer0": 11.163536846637726, "mean_norm/layer1": 10.814097344875336, "mean_norm/layer10": 11.146620213985443, "mean_norm/layer11": 11.529425144195557, "mean_norm/layer12": 12.236510634422302, "mean_norm/layer13": 11.1696857213974, "mean_norm/layer14": 11.61343002319336, "mean_norm/layer15": 12.031220376491547, "mean_norm/layer16": 11.243366599082947, "mean_norm/layer17": 11.79428768157959, "mean_norm/layer18": 11.236949563026428, "mean_norm/layer19": 11.307882249355316, "mean_norm/layer2": 9.097050428390503, "mean_norm/layer20": 11.415169477462769, "mean_norm/layer21": 11.379999816417694, "mean_norm/layer22": 12.554370284080505, "mean_norm/layer23": 12.506138384342194, "mean_norm/layer3": 12.008520364761353, "mean_norm/layer4": 10.52201795578003, "mean_norm/layer5": 13.457939386367798, "mean_norm/layer6": 9.928470611572266, "mean_norm/layer7": 10.559760689735413, "mean_norm/layer8": 11.140100836753845, "mean_norm/layer9": 11.052512347698212, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 12850 }, { "epoch": 5.37, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46929744507043397, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.721813440322876, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 10.8261, "eval_samples_per_second": 22.261, "eval_steps_per_second": 0.739, "step": 12850 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.39, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4, "max_norm": 40.53966522216797, "max_norm/layer0": 30.93181610107422, "max_norm/layer1": 32.67628479003906, "max_norm/layer10": 34.52503204345703, "max_norm/layer11": 31.753511428833008, "max_norm/layer12": 36.52308654785156, "max_norm/layer13": 32.05752944946289, "max_norm/layer14": 33.178993225097656, "max_norm/layer15": 40.18899917602539, "max_norm/layer16": 33.12994384765625, "max_norm/layer17": 40.53966522216797, "max_norm/layer18": 35.019256591796875, "max_norm/layer19": 34.60889434814453, "max_norm/layer2": 25.012950897216797, "max_norm/layer20": 34.865150451660156, "max_norm/layer21": 34.9974479675293, "max_norm/layer22": 35.567359924316406, "max_norm/layer23": 33.68381881713867, "max_norm/layer3": 31.623594284057617, "max_norm/layer4": 31.476152420043945, "max_norm/layer5": 39.99509811401367, "max_norm/layer6": 26.33111000061035, "max_norm/layer7": 34.27658462524414, "max_norm/layer8": 33.315608978271484, "max_norm/layer9": 33.71103286743164, "mean_norm": 11.38135044525067, "mean_norm/layer0": 11.177644968032837, "mean_norm/layer1": 10.823881030082703, "mean_norm/layer10": 11.155748844146729, "mean_norm/layer11": 11.539595305919647, "mean_norm/layer12": 12.249578356742859, "mean_norm/layer13": 11.179333209991455, "mean_norm/layer14": 11.62400072813034, "mean_norm/layer15": 12.043241918087006, "mean_norm/layer16": 11.252710223197937, "mean_norm/layer17": 11.804608881473541, "mean_norm/layer18": 11.245511174201965, "mean_norm/layer19": 11.3168506026268, "mean_norm/layer2": 9.100809633731842, "mean_norm/layer20": 11.424018442630768, "mean_norm/layer21": 11.388995170593262, "mean_norm/layer22": 12.56649899482727, "mean_norm/layer23": 12.51846170425415, "mean_norm/layer3": 12.021824836730957, "mean_norm/layer4": 10.53019380569458, "mean_norm/layer5": 13.475353181362152, "mean_norm/layer6": 9.934614837169647, "mean_norm/layer7": 10.567758977413177, "mean_norm/layer8": 11.149481892585754, "mean_norm/layer9": 11.061693966388702, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 12900 }, { "epoch": 5.39, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4691068089542189, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.717646837234497, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6585, "eval_samples_per_second": 20.672, "eval_steps_per_second": 0.686, "step": 12900 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.41, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.3993, "max_norm": 40.673301696777344, "max_norm/layer0": 30.998746871948242, "max_norm/layer1": 32.77350616455078, "max_norm/layer10": 34.62392807006836, "max_norm/layer11": 31.82044219970703, "max_norm/layer12": 36.621395111083984, "max_norm/layer13": 32.15480041503906, "max_norm/layer14": 33.264678955078125, "max_norm/layer15": 40.30952453613281, "max_norm/layer16": 33.21421813964844, "max_norm/layer17": 40.673301696777344, "max_norm/layer18": 35.126922607421875, "max_norm/layer19": 34.703487396240234, "max_norm/layer2": 25.046913146972656, "max_norm/layer20": 34.96284484863281, "max_norm/layer21": 35.083953857421875, "max_norm/layer22": 35.669921875, "max_norm/layer23": 33.7749137878418, "max_norm/layer3": 31.69327163696289, "max_norm/layer4": 31.55188751220703, "max_norm/layer5": 40.09039306640625, "max_norm/layer6": 26.382938385009766, "max_norm/layer7": 34.37516784667969, "max_norm/layer8": 33.3942985534668, "max_norm/layer9": 33.79991149902344, "mean_norm": 11.391558771332106, "mean_norm/layer0": 11.191831350326538, "mean_norm/layer1": 10.833774149417877, "mean_norm/layer10": 11.165005505084991, "mean_norm/layer11": 11.549969255924225, "mean_norm/layer12": 12.262792706489563, "mean_norm/layer13": 11.189042687416077, "mean_norm/layer14": 11.634574472904205, "mean_norm/layer15": 12.05532854795456, "mean_norm/layer16": 11.26214224100113, "mean_norm/layer17": 11.81501454114914, "mean_norm/layer18": 11.254182398319244, "mean_norm/layer19": 11.325855612754822, "mean_norm/layer2": 9.104621648788452, "mean_norm/layer20": 11.432913839817047, "mean_norm/layer21": 11.398003339767456, "mean_norm/layer22": 12.578662037849426, "mean_norm/layer23": 12.530750453472137, "mean_norm/layer3": 12.035245954990387, "mean_norm/layer4": 10.538455426692963, "mean_norm/layer5": 13.492934942245483, "mean_norm/layer6": 9.94073635339737, "mean_norm/layer7": 10.575691282749176, "mean_norm/layer8": 11.15895789861679, "mean_norm/layer9": 11.070923864841461, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 12950 }, { "epoch": 5.41, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4688512754367392, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.718743324279785, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8444, "eval_samples_per_second": 20.347, "eval_steps_per_second": 0.675, "step": 12950 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.43, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4133, "max_norm": 40.796546936035156, "max_norm/layer0": 31.071434020996094, "max_norm/layer1": 32.860477447509766, "max_norm/layer10": 34.711509704589844, "max_norm/layer11": 31.88778305053711, "max_norm/layer12": 36.72361755371094, "max_norm/layer13": 32.25141525268555, "max_norm/layer14": 33.352420806884766, "max_norm/layer15": 40.42947769165039, "max_norm/layer16": 33.28781509399414, "max_norm/layer17": 40.796546936035156, "max_norm/layer18": 35.232322692871094, "max_norm/layer19": 34.80649185180664, "max_norm/layer2": 25.087366104125977, "max_norm/layer20": 35.050086975097656, "max_norm/layer21": 35.175132751464844, "max_norm/layer22": 35.75883865356445, "max_norm/layer23": 33.876068115234375, "max_norm/layer3": 31.762784957885742, "max_norm/layer4": 31.617982864379883, "max_norm/layer5": 40.18153762817383, "max_norm/layer6": 26.44247055053711, "max_norm/layer7": 34.473243713378906, "max_norm/layer8": 33.4754638671875, "max_norm/layer9": 33.89864730834961, "mean_norm": 11.40168750534455, "mean_norm/layer0": 11.205902516841888, "mean_norm/layer1": 10.84367960691452, "mean_norm/layer10": 11.174164533615112, "mean_norm/layer11": 11.560200273990631, "mean_norm/layer12": 12.275927484035492, "mean_norm/layer13": 11.198736369609833, "mean_norm/layer14": 11.64512050151825, "mean_norm/layer15": 12.067360758781433, "mean_norm/layer16": 11.271453142166138, "mean_norm/layer17": 11.825299143791199, "mean_norm/layer18": 11.262673079967499, "mean_norm/layer19": 11.33467322587967, "mean_norm/layer2": 9.108363032341003, "mean_norm/layer20": 11.441703617572784, "mean_norm/layer21": 11.406952321529388, "mean_norm/layer22": 12.590731382369995, "mean_norm/layer23": 12.543003857135773, "mean_norm/layer3": 12.048669159412384, "mean_norm/layer4": 10.546570122241974, "mean_norm/layer5": 13.510445177555084, "mean_norm/layer6": 9.946801245212555, "mean_norm/layer7": 10.583557188510895, "mean_norm/layer8": 11.168345034122467, "mean_norm/layer9": 11.080167353153229, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 13000 }, { "epoch": 5.43, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4694231837853843, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.722926616668701, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6383, "eval_samples_per_second": 20.707, "eval_steps_per_second": 0.687, "step": 13000 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.45, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4043, "max_norm": 40.9404296875, "max_norm/layer0": 31.16077423095703, "max_norm/layer1": 32.95548629760742, "max_norm/layer10": 34.809906005859375, "max_norm/layer11": 31.963796615600586, "max_norm/layer12": 36.830169677734375, "max_norm/layer13": 32.35176467895508, "max_norm/layer14": 33.43437194824219, "max_norm/layer15": 40.522647857666016, "max_norm/layer16": 33.36571502685547, "max_norm/layer17": 40.9404296875, "max_norm/layer18": 35.327171325683594, "max_norm/layer19": 34.913414001464844, "max_norm/layer2": 25.136255264282227, "max_norm/layer20": 35.13398742675781, "max_norm/layer21": 35.26042938232422, "max_norm/layer22": 35.85120391845703, "max_norm/layer23": 33.953338623046875, "max_norm/layer3": 31.837873458862305, "max_norm/layer4": 31.689170837402344, "max_norm/layer5": 40.275970458984375, "max_norm/layer6": 26.50471305847168, "max_norm/layer7": 34.56406021118164, "max_norm/layer8": 33.55378723144531, "max_norm/layer9": 33.99280548095703, "mean_norm": 11.41187767436107, "mean_norm/layer0": 11.22002124786377, "mean_norm/layer1": 10.853593170642853, "mean_norm/layer10": 11.183394372463226, "mean_norm/layer11": 11.570508360862732, "mean_norm/layer12": 12.289067327976227, "mean_norm/layer13": 11.208430171012878, "mean_norm/layer14": 11.65568321943283, "mean_norm/layer15": 12.07946515083313, "mean_norm/layer16": 11.280861020088196, "mean_norm/layer17": 11.835736393928528, "mean_norm/layer18": 11.271266996860504, "mean_norm/layer19": 11.343626499176025, "mean_norm/layer2": 9.112095832824707, "mean_norm/layer20": 11.450542509555817, "mean_norm/layer21": 11.416008174419403, "mean_norm/layer22": 12.602880716323853, "mean_norm/layer23": 12.555341303348541, "mean_norm/layer3": 12.062138319015503, "mean_norm/layer4": 10.554663360118866, "mean_norm/layer5": 13.528029143810272, "mean_norm/layer6": 9.952929139137268, "mean_norm/layer7": 10.591509401798248, "mean_norm/layer8": 11.177850186824799, "mean_norm/layer9": 11.089422166347504, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 13050 }, { "epoch": 5.45, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4680278896581935, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7215194702148438, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6317, "eval_samples_per_second": 20.719, "eval_steps_per_second": 0.688, "step": 13050 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.47, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4184, "max_norm": 41.073753356933594, "max_norm/layer0": 31.25911521911621, "max_norm/layer1": 33.047813415527344, "max_norm/layer10": 34.90483856201172, "max_norm/layer11": 32.04907989501953, "max_norm/layer12": 36.92471694946289, "max_norm/layer13": 32.446258544921875, "max_norm/layer14": 33.51337432861328, "max_norm/layer15": 40.64415740966797, "max_norm/layer16": 33.44923400878906, "max_norm/layer17": 41.073753356933594, "max_norm/layer18": 35.43497848510742, "max_norm/layer19": 35.00997543334961, "max_norm/layer2": 25.17824935913086, "max_norm/layer20": 35.21885299682617, "max_norm/layer21": 35.36158752441406, "max_norm/layer22": 35.92625045776367, "max_norm/layer23": 34.03020095825195, "max_norm/layer3": 31.913679122924805, "max_norm/layer4": 31.755531311035156, "max_norm/layer5": 40.36668014526367, "max_norm/layer6": 26.55792999267578, "max_norm/layer7": 34.648197174072266, "max_norm/layer8": 33.62436294555664, "max_norm/layer9": 34.08570098876953, "mean_norm": 11.421943314373493, "mean_norm/layer0": 11.233939230442047, "mean_norm/layer1": 10.863298058509827, "mean_norm/layer10": 11.192550837993622, "mean_norm/layer11": 11.580713331699371, "mean_norm/layer12": 12.302023231983185, "mean_norm/layer13": 11.218043863773346, "mean_norm/layer14": 11.666103959083557, "mean_norm/layer15": 12.091457724571228, "mean_norm/layer16": 11.29023402929306, "mean_norm/layer17": 11.846083104610443, "mean_norm/layer18": 11.27977341413498, "mean_norm/layer19": 11.352494895458221, "mean_norm/layer2": 9.115803480148315, "mean_norm/layer20": 11.45926821231842, "mean_norm/layer21": 11.42496120929718, "mean_norm/layer22": 12.614860355854034, "mean_norm/layer23": 12.567517876625061, "mean_norm/layer3": 12.075318932533264, "mean_norm/layer4": 10.562665104866028, "mean_norm/layer5": 13.545399487018585, "mean_norm/layer6": 9.9589102268219, "mean_norm/layer7": 10.599405288696289, "mean_norm/layer8": 11.187245190143585, "mean_norm/layer9": 11.098568499088287, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 13100 }, { "epoch": 5.47, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46916359418032555, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7211787700653076, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 10.8252, "eval_samples_per_second": 22.263, "eval_steps_per_second": 0.739, "step": 13100 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.49, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4133, "max_norm": 41.19325637817383, "max_norm/layer0": 31.352529525756836, "max_norm/layer1": 33.13313293457031, "max_norm/layer10": 34.997493743896484, "max_norm/layer11": 32.13360595703125, "max_norm/layer12": 37.020450592041016, "max_norm/layer13": 32.550804138183594, "max_norm/layer14": 33.60025405883789, "max_norm/layer15": 40.751651763916016, "max_norm/layer16": 33.52793884277344, "max_norm/layer17": 41.19325637817383, "max_norm/layer18": 35.55864715576172, "max_norm/layer19": 35.10562515258789, "max_norm/layer2": 25.227224349975586, "max_norm/layer20": 35.30140686035156, "max_norm/layer21": 35.45964431762695, "max_norm/layer22": 36.017539978027344, "max_norm/layer23": 34.118995666503906, "max_norm/layer3": 31.98078155517578, "max_norm/layer4": 31.82782554626465, "max_norm/layer5": 40.46044921875, "max_norm/layer6": 26.614765167236328, "max_norm/layer7": 34.73370361328125, "max_norm/layer8": 33.699100494384766, "max_norm/layer9": 34.17997741699219, "mean_norm": 11.43214280406634, "mean_norm/layer0": 11.247965574264526, "mean_norm/layer1": 10.873225510120392, "mean_norm/layer10": 11.20186734199524, "mean_norm/layer11": 11.591102659702301, "mean_norm/layer12": 12.315137565135956, "mean_norm/layer13": 11.227831721305847, "mean_norm/layer14": 11.676612555980682, "mean_norm/layer15": 12.103615701198578, "mean_norm/layer16": 11.29973292350769, "mean_norm/layer17": 11.856513440608978, "mean_norm/layer18": 11.288440763950348, "mean_norm/layer19": 11.361487448215485, "mean_norm/layer2": 9.11957997083664, "mean_norm/layer20": 11.468166828155518, "mean_norm/layer21": 11.433948516845703, "mean_norm/layer22": 12.62698209285736, "mean_norm/layer23": 12.579815804958344, "mean_norm/layer3": 12.088749766349792, "mean_norm/layer4": 10.570803761482239, "mean_norm/layer5": 13.562963128089905, "mean_norm/layer6": 9.965040504932404, "mean_norm/layer7": 10.607343137264252, "mean_norm/layer8": 11.196721315383911, "mean_norm/layer9": 11.107779264450073, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 13150 }, { "epoch": 5.49, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4688472193491602, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7161834239959717, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8658, "eval_samples_per_second": 20.31, "eval_steps_per_second": 0.674, "step": 13150 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.51, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.412, "max_norm": 41.33484649658203, "max_norm/layer0": 31.432945251464844, "max_norm/layer1": 33.227447509765625, "max_norm/layer10": 35.095306396484375, "max_norm/layer11": 32.22079849243164, "max_norm/layer12": 37.126129150390625, "max_norm/layer13": 32.637577056884766, "max_norm/layer14": 33.67879104614258, "max_norm/layer15": 40.858245849609375, "max_norm/layer16": 33.607337951660156, "max_norm/layer17": 41.33484649658203, "max_norm/layer18": 35.682640075683594, "max_norm/layer19": 35.209678649902344, "max_norm/layer2": 25.263656616210938, "max_norm/layer20": 35.401668548583984, "max_norm/layer21": 35.54304885864258, "max_norm/layer22": 36.10606384277344, "max_norm/layer23": 34.20365524291992, "max_norm/layer3": 32.0433349609375, "max_norm/layer4": 31.899898529052734, "max_norm/layer5": 40.55813980102539, "max_norm/layer6": 26.6668643951416, "max_norm/layer7": 34.81508255004883, "max_norm/layer8": 33.77111053466797, "max_norm/layer9": 34.279014587402344, "mean_norm": 11.442247187097868, "mean_norm/layer0": 11.261785089969635, "mean_norm/layer1": 10.883079826831818, "mean_norm/layer10": 11.210987150669098, "mean_norm/layer11": 11.601315975189209, "mean_norm/layer12": 12.32822459936142, "mean_norm/layer13": 11.237483143806458, "mean_norm/layer14": 11.68710470199585, "mean_norm/layer15": 12.11562329530716, "mean_norm/layer16": 11.309135794639587, "mean_norm/layer17": 11.86676573753357, "mean_norm/layer18": 11.296909749507904, "mean_norm/layer19": 11.37040263414383, "mean_norm/layer2": 9.123386025428772, "mean_norm/layer20": 11.477011442184448, "mean_norm/layer21": 11.442870557308197, "mean_norm/layer22": 12.638907492160797, "mean_norm/layer23": 12.591942846775055, "mean_norm/layer3": 12.102109968662262, "mean_norm/layer4": 10.578868985176086, "mean_norm/layer5": 13.58046168088913, "mean_norm/layer6": 9.971136212348938, "mean_norm/layer7": 10.61527305841446, "mean_norm/layer8": 11.206160426139832, "mean_norm/layer9": 11.116986095905304, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 13200 }, { "epoch": 5.51, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46872959280936793, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.717339515686035, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8507, "eval_samples_per_second": 20.336, "eval_steps_per_second": 0.675, "step": 13200 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.53, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4223, "max_norm": 41.460872650146484, "max_norm/layer0": 31.52048110961914, "max_norm/layer1": 33.32143020629883, "max_norm/layer10": 35.188270568847656, "max_norm/layer11": 32.29136657714844, "max_norm/layer12": 37.231136322021484, "max_norm/layer13": 32.73362350463867, "max_norm/layer14": 33.75789260864258, "max_norm/layer15": 40.970985412597656, "max_norm/layer16": 33.6841926574707, "max_norm/layer17": 41.460872650146484, "max_norm/layer18": 35.798545837402344, "max_norm/layer19": 35.29481506347656, "max_norm/layer2": 25.29656219482422, "max_norm/layer20": 35.4903450012207, "max_norm/layer21": 35.632667541503906, "max_norm/layer22": 36.19403839111328, "max_norm/layer23": 34.284523010253906, "max_norm/layer3": 32.09943771362305, "max_norm/layer4": 31.967790603637695, "max_norm/layer5": 40.65348434448242, "max_norm/layer6": 26.707876205444336, "max_norm/layer7": 34.904991149902344, "max_norm/layer8": 33.850345611572266, "max_norm/layer9": 34.3624267578125, "mean_norm": 11.452307460208734, "mean_norm/layer0": 11.275518834590912, "mean_norm/layer1": 10.892802596092224, "mean_norm/layer10": 11.22011786699295, "mean_norm/layer11": 11.611432790756226, "mean_norm/layer12": 12.341229736804962, "mean_norm/layer13": 11.247182369232178, "mean_norm/layer14": 11.697576940059662, "mean_norm/layer15": 12.127613306045532, "mean_norm/layer16": 11.318461954593658, "mean_norm/layer17": 11.877028286457062, "mean_norm/layer18": 11.305418491363525, "mean_norm/layer19": 11.379250943660736, "mean_norm/layer2": 9.127110540866852, "mean_norm/layer20": 11.485674262046814, "mean_norm/layer21": 11.451743423938751, "mean_norm/layer22": 12.650978088378906, "mean_norm/layer23": 12.604095160961151, "mean_norm/layer3": 12.115413546562195, "mean_norm/layer4": 10.586904525756836, "mean_norm/layer5": 13.59795880317688, "mean_norm/layer6": 9.977186620235443, "mean_norm/layer7": 10.623132765293121, "mean_norm/layer8": 11.215501189231873, "mean_norm/layer9": 11.126046001911163, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 13250 }, { "epoch": 5.53, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4688958924001087, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7104713916778564, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6498, "eval_samples_per_second": 20.687, "eval_steps_per_second": 0.687, "step": 13250 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.55, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4168, "max_norm": 41.58987808227539, "max_norm/layer0": 31.605928421020508, "max_norm/layer1": 33.41110610961914, "max_norm/layer10": 35.28288650512695, "max_norm/layer11": 32.35896682739258, "max_norm/layer12": 37.328975677490234, "max_norm/layer13": 32.81481170654297, "max_norm/layer14": 33.8287353515625, "max_norm/layer15": 41.096561431884766, "max_norm/layer16": 33.78337860107422, "max_norm/layer17": 41.58987808227539, "max_norm/layer18": 35.9139289855957, "max_norm/layer19": 35.399471282958984, "max_norm/layer2": 25.34184455871582, "max_norm/layer20": 35.5942497253418, "max_norm/layer21": 35.72600173950195, "max_norm/layer22": 36.28502655029297, "max_norm/layer23": 34.368873596191406, "max_norm/layer3": 32.15465545654297, "max_norm/layer4": 32.03687286376953, "max_norm/layer5": 40.74073791503906, "max_norm/layer6": 26.754438400268555, "max_norm/layer7": 34.99358367919922, "max_norm/layer8": 33.9345703125, "max_norm/layer9": 34.452205657958984, "mean_norm": 11.462326402465502, "mean_norm/layer0": 11.28924685716629, "mean_norm/layer1": 10.902493834495544, "mean_norm/layer10": 11.229179680347443, "mean_norm/layer11": 11.621479094028473, "mean_norm/layer12": 12.354156792163849, "mean_norm/layer13": 11.256803750991821, "mean_norm/layer14": 11.707986295223236, "mean_norm/layer15": 12.139529526233673, "mean_norm/layer16": 11.327766597270966, "mean_norm/layer17": 11.887259781360626, "mean_norm/layer18": 11.313856422901154, "mean_norm/layer19": 11.38800984621048, "mean_norm/layer2": 9.13087511062622, "mean_norm/layer20": 11.49438589811325, "mean_norm/layer21": 11.460516810417175, "mean_norm/layer22": 12.663020372390747, "mean_norm/layer23": 12.616227269172668, "mean_norm/layer3": 12.128678977489471, "mean_norm/layer4": 10.594914734363556, "mean_norm/layer5": 13.615288376808167, "mean_norm/layer6": 9.983207881450653, "mean_norm/layer7": 10.631061017513275, "mean_norm/layer8": 11.224867701530457, "mean_norm/layer9": 11.135021030902863, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 13300 }, { "epoch": 5.55, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46990991429486945, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7142724990844727, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6426, "eval_samples_per_second": 20.7, "eval_steps_per_second": 0.687, "step": 13300 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.57, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4235, "max_norm": 41.713775634765625, "max_norm/layer0": 31.692907333374023, "max_norm/layer1": 33.50731658935547, "max_norm/layer10": 35.388431549072266, "max_norm/layer11": 32.41889190673828, "max_norm/layer12": 37.428932189941406, "max_norm/layer13": 32.89790344238281, "max_norm/layer14": 33.91184997558594, "max_norm/layer15": 41.21902847290039, "max_norm/layer16": 33.867496490478516, "max_norm/layer17": 41.713775634765625, "max_norm/layer18": 36.05093765258789, "max_norm/layer19": 35.49272155761719, "max_norm/layer2": 25.380748748779297, "max_norm/layer20": 35.684383392333984, "max_norm/layer21": 35.81870651245117, "max_norm/layer22": 36.37220764160156, "max_norm/layer23": 34.44894027709961, "max_norm/layer3": 32.21410369873047, "max_norm/layer4": 32.11796569824219, "max_norm/layer5": 40.8372802734375, "max_norm/layer6": 26.808568954467773, "max_norm/layer7": 35.08625793457031, "max_norm/layer8": 34.01543426513672, "max_norm/layer9": 34.54030227661133, "mean_norm": 11.472280822694302, "mean_norm/layer0": 11.302962839603424, "mean_norm/layer1": 10.912257492542267, "mean_norm/layer10": 11.238200902938843, "mean_norm/layer11": 11.631586790084839, "mean_norm/layer12": 12.366995334625244, "mean_norm/layer13": 11.266227841377258, "mean_norm/layer14": 11.718317866325378, "mean_norm/layer15": 12.151341676712036, "mean_norm/layer16": 11.337043285369873, "mean_norm/layer17": 11.89738005399704, "mean_norm/layer18": 11.322262048721313, "mean_norm/layer19": 11.39665973186493, "mean_norm/layer2": 9.134590566158295, "mean_norm/layer20": 11.503011286258698, "mean_norm/layer21": 11.469366490840912, "mean_norm/layer22": 12.674902260303497, "mean_norm/layer23": 12.628194808959961, "mean_norm/layer3": 12.14181238412857, "mean_norm/layer4": 10.602854549884796, "mean_norm/layer5": 13.632572889328003, "mean_norm/layer6": 9.989143371582031, "mean_norm/layer7": 10.638879597187042, "mean_norm/layer8": 11.23413860797882, "mean_norm/layer9": 11.144037067890167, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 13350 }, { "epoch": 5.57, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46916359418032555, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.714078426361084, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8326, "eval_samples_per_second": 20.367, "eval_steps_per_second": 0.676, "step": 13350 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.59, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4219, "max_norm": 41.837982177734375, "max_norm/layer0": 31.79075813293457, "max_norm/layer1": 33.60240936279297, "max_norm/layer10": 35.48202896118164, "max_norm/layer11": 32.483062744140625, "max_norm/layer12": 37.52994155883789, "max_norm/layer13": 32.990882873535156, "max_norm/layer14": 33.9993782043457, "max_norm/layer15": 41.33662414550781, "max_norm/layer16": 33.95119094848633, "max_norm/layer17": 41.837982177734375, "max_norm/layer18": 36.17069625854492, "max_norm/layer19": 35.598567962646484, "max_norm/layer2": 25.41947364807129, "max_norm/layer20": 35.76862716674805, "max_norm/layer21": 35.891048431396484, "max_norm/layer22": 36.46067810058594, "max_norm/layer23": 34.52641296386719, "max_norm/layer3": 32.27833938598633, "max_norm/layer4": 32.184410095214844, "max_norm/layer5": 40.935646057128906, "max_norm/layer6": 26.854347229003906, "max_norm/layer7": 35.179630279541016, "max_norm/layer8": 34.0980110168457, "max_norm/layer9": 34.62184143066406, "mean_norm": 11.482310282687346, "mean_norm/layer0": 11.316719889640808, "mean_norm/layer1": 10.922053396701813, "mean_norm/layer10": 11.247276484966278, "mean_norm/layer11": 11.64177393913269, "mean_norm/layer12": 12.379945814609528, "mean_norm/layer13": 11.275794327259064, "mean_norm/layer14": 11.72872668504715, "mean_norm/layer15": 12.163222134113312, "mean_norm/layer16": 11.346361517906189, "mean_norm/layer17": 11.907587885856628, "mean_norm/layer18": 11.330709755420685, "mean_norm/layer19": 11.40546178817749, "mean_norm/layer2": 9.138280272483826, "mean_norm/layer20": 11.511772215366364, "mean_norm/layer21": 11.478142619132996, "mean_norm/layer22": 12.686840951442719, "mean_norm/layer23": 12.640309393405914, "mean_norm/layer3": 12.155011892318726, "mean_norm/layer4": 10.610854387283325, "mean_norm/layer5": 13.649908483028412, "mean_norm/layer6": 9.995129764080048, "mean_norm/layer7": 10.6467826962471, "mean_norm/layer8": 11.243535876274109, "mean_norm/layer9": 11.153244614601135, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 13400 }, { "epoch": 5.59, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46905813590327045, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.711637496948242, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6452, "eval_samples_per_second": 20.695, "eval_steps_per_second": 0.687, "step": 13400 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.62, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4137, "max_norm": 41.95629119873047, "max_norm/layer0": 31.894800186157227, "max_norm/layer1": 33.70528793334961, "max_norm/layer10": 35.5774040222168, "max_norm/layer11": 32.56145095825195, "max_norm/layer12": 37.62503433227539, "max_norm/layer13": 33.0743408203125, "max_norm/layer14": 34.08401107788086, "max_norm/layer15": 41.45420455932617, "max_norm/layer16": 34.023075103759766, "max_norm/layer17": 41.95629119873047, "max_norm/layer18": 36.291751861572266, "max_norm/layer19": 35.699798583984375, "max_norm/layer2": 25.462074279785156, "max_norm/layer20": 35.848453521728516, "max_norm/layer21": 35.9924430847168, "max_norm/layer22": 36.55889892578125, "max_norm/layer23": 34.61848449707031, "max_norm/layer3": 32.35057830810547, "max_norm/layer4": 32.256893157958984, "max_norm/layer5": 41.03318786621094, "max_norm/layer6": 26.913339614868164, "max_norm/layer7": 35.26021957397461, "max_norm/layer8": 34.18633270263672, "max_norm/layer9": 34.706512451171875, "mean_norm": 11.492379434406757, "mean_norm/layer0": 11.330553650856018, "mean_norm/layer1": 10.931818127632141, "mean_norm/layer10": 11.256403625011444, "mean_norm/layer11": 11.652017891407013, "mean_norm/layer12": 12.392934620380402, "mean_norm/layer13": 11.2853382229805, "mean_norm/layer14": 11.739181399345398, "mean_norm/layer15": 12.175087809562683, "mean_norm/layer16": 11.355721652507782, "mean_norm/layer17": 11.917894303798676, "mean_norm/layer18": 11.339221060276031, "mean_norm/layer19": 11.414319634437561, "mean_norm/layer2": 9.14203691482544, "mean_norm/layer20": 11.520379364490509, "mean_norm/layer21": 11.487022876739502, "mean_norm/layer22": 12.698857307434082, "mean_norm/layer23": 12.652542471885681, "mean_norm/layer3": 12.168289422988892, "mean_norm/layer4": 10.618834555149078, "mean_norm/layer5": 13.667337656021118, "mean_norm/layer6": 10.001234710216522, "mean_norm/layer7": 10.654753506183624, "mean_norm/layer8": 11.252941370010376, "mean_norm/layer9": 11.162384271621704, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 13450 }, { "epoch": 5.62, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4691311454796932, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.709066390991211, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6434, "eval_samples_per_second": 20.698, "eval_steps_per_second": 0.687, "step": 13450 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.64, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4237, "max_norm": 42.06662368774414, "max_norm/layer0": 31.995527267456055, "max_norm/layer1": 33.81433868408203, "max_norm/layer10": 35.674861907958984, "max_norm/layer11": 32.633907318115234, "max_norm/layer12": 37.72537612915039, "max_norm/layer13": 33.15221405029297, "max_norm/layer14": 34.16411590576172, "max_norm/layer15": 41.57180404663086, "max_norm/layer16": 34.10177993774414, "max_norm/layer17": 42.06662368774414, "max_norm/layer18": 36.408756256103516, "max_norm/layer19": 35.804447174072266, "max_norm/layer2": 25.517255783081055, "max_norm/layer20": 35.92195129394531, "max_norm/layer21": 36.10334777832031, "max_norm/layer22": 36.6356086730957, "max_norm/layer23": 34.714378356933594, "max_norm/layer3": 32.415916442871094, "max_norm/layer4": 32.33707046508789, "max_norm/layer5": 41.12393569946289, "max_norm/layer6": 26.9628849029541, "max_norm/layer7": 35.34476852416992, "max_norm/layer8": 34.27030563354492, "max_norm/layer9": 34.790771484375, "mean_norm": 11.502338218192259, "mean_norm/layer0": 11.344147622585297, "mean_norm/layer1": 10.941574037075043, "mean_norm/layer10": 11.26539170742035, "mean_norm/layer11": 11.66208666563034, "mean_norm/layer12": 12.405764102935791, "mean_norm/layer13": 11.294852435588837, "mean_norm/layer14": 11.749512732028961, "mean_norm/layer15": 12.18685758113861, "mean_norm/layer16": 11.364993393421173, "mean_norm/layer17": 11.928065538406372, "mean_norm/layer18": 11.347671389579773, "mean_norm/layer19": 11.423152148723602, "mean_norm/layer2": 9.145713448524475, "mean_norm/layer20": 11.52916818857193, "mean_norm/layer21": 11.49576997756958, "mean_norm/layer22": 12.710700571537018, "mean_norm/layer23": 12.664546847343445, "mean_norm/layer3": 12.181446313858032, "mean_norm/layer4": 10.626774251461029, "mean_norm/layer5": 13.684615194797516, "mean_norm/layer6": 10.00717294216156, "mean_norm/layer7": 10.662572145462036, "mean_norm/layer8": 11.262239933013916, "mean_norm/layer9": 11.171328067779541, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 13500 }, { "epoch": 5.64, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4694353520481214, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7050700187683105, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 10.81, "eval_samples_per_second": 22.294, "eval_steps_per_second": 0.74, "step": 13500 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.66, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4288, "max_norm": 42.18446350097656, "max_norm/layer0": 32.09495162963867, "max_norm/layer1": 33.92106246948242, "max_norm/layer10": 35.778926849365234, "max_norm/layer11": 32.708717346191406, "max_norm/layer12": 37.83408737182617, "max_norm/layer13": 33.22709274291992, "max_norm/layer14": 34.2531852722168, "max_norm/layer15": 41.674163818359375, "max_norm/layer16": 34.1853141784668, "max_norm/layer17": 42.18446350097656, "max_norm/layer18": 36.49985885620117, "max_norm/layer19": 35.90671157836914, "max_norm/layer2": 25.565250396728516, "max_norm/layer20": 36.003273010253906, "max_norm/layer21": 36.20390319824219, "max_norm/layer22": 36.71393585205078, "max_norm/layer23": 34.7982292175293, "max_norm/layer3": 32.48151397705078, "max_norm/layer4": 32.41646194458008, "max_norm/layer5": 41.22113800048828, "max_norm/layer6": 27.021968841552734, "max_norm/layer7": 35.427452087402344, "max_norm/layer8": 34.34320068359375, "max_norm/layer9": 34.87732696533203, "mean_norm": 11.512315717836222, "mean_norm/layer0": 11.357698917388916, "mean_norm/layer1": 10.951256394386292, "mean_norm/layer10": 11.274416208267212, "mean_norm/layer11": 11.672086000442505, "mean_norm/layer12": 12.41863089799881, "mean_norm/layer13": 11.30438607931137, "mean_norm/layer14": 11.759986698627472, "mean_norm/layer15": 12.198642432689667, "mean_norm/layer16": 11.374230086803436, "mean_norm/layer17": 11.938192427158356, "mean_norm/layer18": 11.356159150600433, "mean_norm/layer19": 11.432008922100067, "mean_norm/layer2": 9.14939570426941, "mean_norm/layer20": 11.537839412689209, "mean_norm/layer21": 11.504580557346344, "mean_norm/layer22": 12.722698092460632, "mean_norm/layer23": 12.676586389541626, "mean_norm/layer3": 12.194705128669739, "mean_norm/layer4": 10.634714663028717, "mean_norm/layer5": 13.701936960220337, "mean_norm/layer6": 10.013112783432007, "mean_norm/layer7": 10.670415759086609, "mean_norm/layer8": 11.271536707878113, "mean_norm/layer9": 11.180360853672028, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 13550 }, { "epoch": 5.66, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46922037940643213, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7097346782684326, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.847, "eval_samples_per_second": 20.343, "eval_steps_per_second": 0.675, "step": 13550 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.68, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.417, "max_norm": 42.29948043823242, "max_norm/layer0": 32.19629669189453, "max_norm/layer1": 34.0298957824707, "max_norm/layer10": 35.873329162597656, "max_norm/layer11": 32.782554626464844, "max_norm/layer12": 37.94023895263672, "max_norm/layer13": 33.30521011352539, "max_norm/layer14": 34.3357048034668, "max_norm/layer15": 41.79225540161133, "max_norm/layer16": 34.278114318847656, "max_norm/layer17": 42.29948043823242, "max_norm/layer18": 36.587486267089844, "max_norm/layer19": 36.01373291015625, "max_norm/layer2": 25.616296768188477, "max_norm/layer20": 36.0982780456543, "max_norm/layer21": 36.2936897277832, "max_norm/layer22": 36.797672271728516, "max_norm/layer23": 34.886837005615234, "max_norm/layer3": 32.53889846801758, "max_norm/layer4": 32.496707916259766, "max_norm/layer5": 41.32212448120117, "max_norm/layer6": 27.078197479248047, "max_norm/layer7": 35.5162467956543, "max_norm/layer8": 34.416038513183594, "max_norm/layer9": 34.968238830566406, "mean_norm": 11.52224476635456, "mean_norm/layer0": 11.371230006217957, "mean_norm/layer1": 10.96083915233612, "mean_norm/layer10": 11.283371925354004, "mean_norm/layer11": 11.682111740112305, "mean_norm/layer12": 12.431476056575775, "mean_norm/layer13": 11.313903331756592, "mean_norm/layer14": 11.770337045192719, "mean_norm/layer15": 12.210534811019897, "mean_norm/layer16": 11.383462309837341, "mean_norm/layer17": 11.948289573192596, "mean_norm/layer18": 11.364611744880676, "mean_norm/layer19": 11.440718173980713, "mean_norm/layer2": 9.153079271316528, "mean_norm/layer20": 11.54639196395874, "mean_norm/layer21": 11.51335096359253, "mean_norm/layer22": 12.734551429748535, "mean_norm/layer23": 12.68855208158493, "mean_norm/layer3": 12.207791090011597, "mean_norm/layer4": 10.642626106739044, "mean_norm/layer5": 13.719220459461212, "mean_norm/layer6": 10.01904433965683, "mean_norm/layer7": 10.678197205066681, "mean_norm/layer8": 11.280803203582764, "mean_norm/layer9": 11.189380407333374, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 13600 }, { "epoch": 5.68, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4692325476691693, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7084743976593018, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8418, "eval_samples_per_second": 20.352, "eval_steps_per_second": 0.676, "step": 13600 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.7, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4312, "max_norm": 42.4152717590332, "max_norm/layer0": 32.290565490722656, "max_norm/layer1": 34.130165100097656, "max_norm/layer10": 35.96076202392578, "max_norm/layer11": 32.853206634521484, "max_norm/layer12": 38.056854248046875, "max_norm/layer13": 33.386722564697266, "max_norm/layer14": 34.417293548583984, "max_norm/layer15": 41.91092300415039, "max_norm/layer16": 34.39151382446289, "max_norm/layer17": 42.4152717590332, "max_norm/layer18": 36.677120208740234, "max_norm/layer19": 36.10676956176758, "max_norm/layer2": 25.653728485107422, "max_norm/layer20": 36.18156051635742, "max_norm/layer21": 36.40180969238281, "max_norm/layer22": 36.877620697021484, "max_norm/layer23": 34.97404479980469, "max_norm/layer3": 32.59130096435547, "max_norm/layer4": 32.57655334472656, "max_norm/layer5": 41.421573638916016, "max_norm/layer6": 27.125125885009766, "max_norm/layer7": 35.60506057739258, "max_norm/layer8": 34.491661071777344, "max_norm/layer9": 35.03976821899414, "mean_norm": 11.532145649194717, "mean_norm/layer0": 11.38479232788086, "mean_norm/layer1": 10.970433294773102, "mean_norm/layer10": 11.292322337627411, "mean_norm/layer11": 11.692193269729614, "mean_norm/layer12": 12.444232642650604, "mean_norm/layer13": 11.323309123516083, "mean_norm/layer14": 11.780568301677704, "mean_norm/layer15": 12.2222620844841, "mean_norm/layer16": 11.392680704593658, "mean_norm/layer17": 11.958375811576843, "mean_norm/layer18": 11.373052775859833, "mean_norm/layer19": 11.449408113956451, "mean_norm/layer2": 9.156772315502167, "mean_norm/layer20": 11.555001676082611, "mean_norm/layer21": 11.522112011909485, "mean_norm/layer22": 12.746351480484009, "mean_norm/layer23": 12.700541198253632, "mean_norm/layer3": 12.220799148082733, "mean_norm/layer4": 10.650478422641754, "mean_norm/layer5": 13.736432790756226, "mean_norm/layer6": 10.024990856647491, "mean_norm/layer7": 10.685915529727936, "mean_norm/layer8": 11.290149748325348, "mean_norm/layer9": 11.198319613933563, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 13650 }, { "epoch": 5.7, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4698977460321323, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.709822177886963, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8453, "eval_samples_per_second": 20.346, "eval_steps_per_second": 0.675, "step": 13650 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.72, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4277, "max_norm": 42.53453063964844, "max_norm/layer0": 32.37334060668945, "max_norm/layer1": 34.23046875, "max_norm/layer10": 36.06345748901367, "max_norm/layer11": 32.92584228515625, "max_norm/layer12": 38.15459442138672, "max_norm/layer13": 33.48106002807617, "max_norm/layer14": 34.505126953125, "max_norm/layer15": 42.039798736572266, "max_norm/layer16": 34.5018196105957, "max_norm/layer17": 42.53453063964844, "max_norm/layer18": 36.77006530761719, "max_norm/layer19": 36.20204162597656, "max_norm/layer2": 25.69436264038086, "max_norm/layer20": 36.26368713378906, "max_norm/layer21": 36.49669647216797, "max_norm/layer22": 36.958030700683594, "max_norm/layer23": 35.077667236328125, "max_norm/layer3": 32.64958953857422, "max_norm/layer4": 32.6416130065918, "max_norm/layer5": 41.52423858642578, "max_norm/layer6": 27.177854537963867, "max_norm/layer7": 35.69281005859375, "max_norm/layer8": 34.58332061767578, "max_norm/layer9": 35.11589050292969, "mean_norm": 11.542051893969377, "mean_norm/layer0": 11.398241758346558, "mean_norm/layer1": 10.9800386428833, "mean_norm/layer10": 11.301402509212494, "mean_norm/layer11": 11.70227837562561, "mean_norm/layer12": 12.457101702690125, "mean_norm/layer13": 11.332804679870605, "mean_norm/layer14": 11.790894746780396, "mean_norm/layer15": 12.233994662761688, "mean_norm/layer16": 11.401872217655182, "mean_norm/layer17": 11.96843957901001, "mean_norm/layer18": 11.381479799747467, "mean_norm/layer19": 11.45817643404007, "mean_norm/layer2": 9.160508751869202, "mean_norm/layer20": 11.563453137874603, "mean_norm/layer21": 11.530731439590454, "mean_norm/layer22": 12.75810968875885, "mean_norm/layer23": 12.712501466274261, "mean_norm/layer3": 12.233920216560364, "mean_norm/layer4": 10.658356189727783, "mean_norm/layer5": 13.753542840480804, "mean_norm/layer6": 10.030904114246368, "mean_norm/layer7": 10.693680703639984, "mean_norm/layer8": 11.299498975276947, "mean_norm/layer9": 11.207312822341919, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 13700 }, { "epoch": 5.72, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.47006810171045216, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.705110549926758, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8501, "eval_samples_per_second": 20.337, "eval_steps_per_second": 0.675, "step": 13700 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.74, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4468, "max_norm": 42.64570999145508, "max_norm/layer0": 32.44587707519531, "max_norm/layer1": 34.328102111816406, "max_norm/layer10": 36.16082763671875, "max_norm/layer11": 32.99917984008789, "max_norm/layer12": 38.26010513305664, "max_norm/layer13": 33.561012268066406, "max_norm/layer14": 34.574607849121094, "max_norm/layer15": 42.16282653808594, "max_norm/layer16": 34.6053466796875, "max_norm/layer17": 42.64570999145508, "max_norm/layer18": 36.88127899169922, "max_norm/layer19": 36.302093505859375, "max_norm/layer2": 25.726064682006836, "max_norm/layer20": 36.354103088378906, "max_norm/layer21": 36.58729934692383, "max_norm/layer22": 37.044952392578125, "max_norm/layer23": 35.16257858276367, "max_norm/layer3": 32.70930480957031, "max_norm/layer4": 32.71389389038086, "max_norm/layer5": 41.630611419677734, "max_norm/layer6": 27.24214744567871, "max_norm/layer7": 35.78268051147461, "max_norm/layer8": 34.67084503173828, "max_norm/layer9": 35.19058609008789, "mean_norm": 11.55191034078598, "mean_norm/layer0": 11.41158139705658, "mean_norm/layer1": 10.989613711833954, "mean_norm/layer10": 11.31038248538971, "mean_norm/layer11": 11.712275445461273, "mean_norm/layer12": 12.469912946224213, "mean_norm/layer13": 11.342234253883362, "mean_norm/layer14": 11.801217436790466, "mean_norm/layer15": 12.245729267597198, "mean_norm/layer16": 11.411094605922699, "mean_norm/layer17": 11.978409945964813, "mean_norm/layer18": 11.38983964920044, "mean_norm/layer19": 11.466777920722961, "mean_norm/layer2": 9.164218246936798, "mean_norm/layer20": 11.571929335594177, "mean_norm/layer21": 11.539337873458862, "mean_norm/layer22": 12.769851624965668, "mean_norm/layer23": 12.7243931889534, "mean_norm/layer3": 12.246965825557709, "mean_norm/layer4": 10.66619747877121, "mean_norm/layer5": 13.770685732364655, "mean_norm/layer6": 10.03677612543106, "mean_norm/layer7": 10.701447129249573, "mean_norm/layer8": 11.308717370033264, "mean_norm/layer9": 11.216259181499481, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 13750 }, { "epoch": 5.74, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4706521783218343, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7009119987487793, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8368, "eval_samples_per_second": 20.36, "eval_steps_per_second": 0.676, "step": 13750 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.76, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4278, "max_norm": 42.74515151977539, "max_norm/layer0": 32.518287658691406, "max_norm/layer1": 34.43461990356445, "max_norm/layer10": 36.25341033935547, "max_norm/layer11": 33.06514358520508, "max_norm/layer12": 38.34977340698242, "max_norm/layer13": 33.64243698120117, "max_norm/layer14": 34.654720306396484, "max_norm/layer15": 42.259647369384766, "max_norm/layer16": 34.71818542480469, "max_norm/layer17": 42.74515151977539, "max_norm/layer18": 36.984222412109375, "max_norm/layer19": 36.397159576416016, "max_norm/layer2": 25.7700252532959, "max_norm/layer20": 36.44501876831055, "max_norm/layer21": 36.675048828125, "max_norm/layer22": 37.133079528808594, "max_norm/layer23": 35.23983383178711, "max_norm/layer3": 32.766868591308594, "max_norm/layer4": 32.78180694580078, "max_norm/layer5": 41.73137283325195, "max_norm/layer6": 27.297748565673828, "max_norm/layer7": 35.863887786865234, "max_norm/layer8": 34.7591438293457, "max_norm/layer9": 35.272220611572266, "mean_norm": 11.561812994380793, "mean_norm/layer0": 11.425028920173645, "mean_norm/layer1": 10.999259412288666, "mean_norm/layer10": 11.319396913051605, "mean_norm/layer11": 11.722336232662201, "mean_norm/layer12": 12.482789993286133, "mean_norm/layer13": 11.35170429944992, "mean_norm/layer14": 11.811590790748596, "mean_norm/layer15": 12.257381975650787, "mean_norm/layer16": 11.42035436630249, "mean_norm/layer17": 11.988508760929108, "mean_norm/layer18": 11.398184061050415, "mean_norm/layer19": 11.475438952445984, "mean_norm/layer2": 9.167939245700836, "mean_norm/layer20": 11.580475270748138, "mean_norm/layer21": 11.548064768314362, "mean_norm/layer22": 12.781589150428772, "mean_norm/layer23": 12.736304581165314, "mean_norm/layer3": 12.26003360748291, "mean_norm/layer4": 10.674065291881561, "mean_norm/layer5": 13.787844359874725, "mean_norm/layer6": 10.04273635149002, "mean_norm/layer7": 10.709193885326385, "mean_norm/layer8": 11.318026006221771, "mean_norm/layer9": 11.22526466846466, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 13800 }, { "epoch": 5.76, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4695935394637041, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7042880058288574, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8457, "eval_samples_per_second": 20.345, "eval_steps_per_second": 0.675, "step": 13800 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.78, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4311, "max_norm": 42.867034912109375, "max_norm/layer0": 32.59137725830078, "max_norm/layer1": 34.52602767944336, "max_norm/layer10": 36.34048080444336, "max_norm/layer11": 33.140743255615234, "max_norm/layer12": 38.443443298339844, "max_norm/layer13": 33.72990798950195, "max_norm/layer14": 34.72901916503906, "max_norm/layer15": 42.37352752685547, "max_norm/layer16": 34.81253433227539, "max_norm/layer17": 42.867034912109375, "max_norm/layer18": 37.07355499267578, "max_norm/layer19": 36.49341583251953, "max_norm/layer2": 25.837297439575195, "max_norm/layer20": 36.53437042236328, "max_norm/layer21": 36.775245666503906, "max_norm/layer22": 37.215858459472656, "max_norm/layer23": 35.314640045166016, "max_norm/layer3": 32.82737731933594, "max_norm/layer4": 32.852108001708984, "max_norm/layer5": 41.8297233581543, "max_norm/layer6": 27.339946746826172, "max_norm/layer7": 35.94553756713867, "max_norm/layer8": 34.851322174072266, "max_norm/layer9": 35.35096740722656, "mean_norm": 11.571596026420593, "mean_norm/layer0": 11.438275337219238, "mean_norm/layer1": 11.008784472942352, "mean_norm/layer10": 11.328203916549683, "mean_norm/layer11": 11.732258260250092, "mean_norm/layer12": 12.495415687561035, "mean_norm/layer13": 11.360939621925354, "mean_norm/layer14": 11.821831226348877, "mean_norm/layer15": 12.269017338752747, "mean_norm/layer16": 11.429407954216003, "mean_norm/layer17": 11.99849796295166, "mean_norm/layer18": 11.406443893909454, "mean_norm/layer19": 11.4840726852417, "mean_norm/layer2": 9.171578586101532, "mean_norm/layer20": 11.589037954807281, "mean_norm/layer21": 11.55676382780075, "mean_norm/layer22": 12.793222546577454, "mean_norm/layer23": 12.748144805431366, "mean_norm/layer3": 12.27302098274231, "mean_norm/layer4": 10.68181574344635, "mean_norm/layer5": 13.804852664470673, "mean_norm/layer6": 10.048506796360016, "mean_norm/layer7": 10.716846406459808, "mean_norm/layer8": 11.327199518680573, "mean_norm/layer9": 11.234166443347931, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 13850 }, { "epoch": 5.78, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4705913370081487, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7011148929595947, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6359, "eval_samples_per_second": 20.712, "eval_steps_per_second": 0.688, "step": 13850 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.8, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4379, "max_norm": 42.9991340637207, "max_norm/layer0": 32.67675018310547, "max_norm/layer1": 34.62179183959961, "max_norm/layer10": 36.44373321533203, "max_norm/layer11": 33.20524978637695, "max_norm/layer12": 38.551753997802734, "max_norm/layer13": 33.821502685546875, "max_norm/layer14": 34.808998107910156, "max_norm/layer15": 42.49689483642578, "max_norm/layer16": 34.90584182739258, "max_norm/layer17": 42.9991340637207, "max_norm/layer18": 37.173526763916016, "max_norm/layer19": 36.60969161987305, "max_norm/layer2": 25.892879486083984, "max_norm/layer20": 36.612857818603516, "max_norm/layer21": 36.875526428222656, "max_norm/layer22": 37.30345153808594, "max_norm/layer23": 35.393680572509766, "max_norm/layer3": 32.886417388916016, "max_norm/layer4": 32.9256591796875, "max_norm/layer5": 41.92585372924805, "max_norm/layer6": 27.39628028869629, "max_norm/layer7": 36.030879974365234, "max_norm/layer8": 34.93297576904297, "max_norm/layer9": 35.42243194580078, "mean_norm": 11.581335020562014, "mean_norm/layer0": 11.45145434141159, "mean_norm/layer1": 11.018277168273926, "mean_norm/layer10": 11.33707845211029, "mean_norm/layer11": 11.742176473140717, "mean_norm/layer12": 12.507989645004272, "mean_norm/layer13": 11.370223939418793, "mean_norm/layer14": 11.831981182098389, "mean_norm/layer15": 12.280655086040497, "mean_norm/layer16": 11.438491344451904, "mean_norm/layer17": 12.00839626789093, "mean_norm/layer18": 11.414667963981628, "mean_norm/layer19": 11.49258005619049, "mean_norm/layer2": 9.175205826759338, "mean_norm/layer20": 11.597498834133148, "mean_norm/layer21": 11.565355122089386, "mean_norm/layer22": 12.804871678352356, "mean_norm/layer23": 12.75985324382782, "mean_norm/layer3": 12.285956501960754, "mean_norm/layer4": 10.689500033855438, "mean_norm/layer5": 13.821775257587433, "mean_norm/layer6": 10.054342985153198, "mean_norm/layer7": 10.724383294582367, "mean_norm/layer8": 11.336312234401703, "mean_norm/layer9": 11.243013560771942, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 13900 }, { "epoch": 5.8, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.47070085137278284, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7012670040130615, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8509, "eval_samples_per_second": 20.336, "eval_steps_per_second": 0.675, "step": 13900 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.82, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4347, "max_norm": 43.10231018066406, "max_norm/layer0": 32.753517150878906, "max_norm/layer1": 34.715728759765625, "max_norm/layer10": 36.539344787597656, "max_norm/layer11": 33.28629684448242, "max_norm/layer12": 38.66322326660156, "max_norm/layer13": 33.89580535888672, "max_norm/layer14": 34.89205551147461, "max_norm/layer15": 42.609230041503906, "max_norm/layer16": 35.00455093383789, "max_norm/layer17": 43.10231018066406, "max_norm/layer18": 37.268592834472656, "max_norm/layer19": 36.70490646362305, "max_norm/layer2": 25.953227996826172, "max_norm/layer20": 36.691898345947266, "max_norm/layer21": 36.96839904785156, "max_norm/layer22": 37.388004302978516, "max_norm/layer23": 35.4702262878418, "max_norm/layer3": 32.95038604736328, "max_norm/layer4": 32.99562454223633, "max_norm/layer5": 42.026756286621094, "max_norm/layer6": 27.448122024536133, "max_norm/layer7": 36.12428665161133, "max_norm/layer8": 35.01604080200195, "max_norm/layer9": 35.487979888916016, "mean_norm": 11.591110952198505, "mean_norm/layer0": 11.464677512645721, "mean_norm/layer1": 11.027840971946716, "mean_norm/layer10": 11.345887303352356, "mean_norm/layer11": 11.752020120620728, "mean_norm/layer12": 12.520609438419342, "mean_norm/layer13": 11.379559338092804, "mean_norm/layer14": 11.842145323753357, "mean_norm/layer15": 12.29226964712143, "mean_norm/layer16": 11.447559237480164, "mean_norm/layer17": 12.018401503562927, "mean_norm/layer18": 11.422959864139557, "mean_norm/layer19": 11.501260638237, "mean_norm/layer2": 9.178790748119354, "mean_norm/layer20": 11.605934798717499, "mean_norm/layer21": 11.574039816856384, "mean_norm/layer22": 12.816502630710602, "mean_norm/layer23": 12.771722674369812, "mean_norm/layer3": 12.298872590065002, "mean_norm/layer4": 10.697331547737122, "mean_norm/layer5": 13.838718593120575, "mean_norm/layer6": 10.060210466384888, "mean_norm/layer7": 10.731984496116638, "mean_norm/layer8": 11.345423817634583, "mean_norm/layer9": 11.25193977355957, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 13950 }, { "epoch": 5.82, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4698206803681305, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7006213665008545, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 10.8275, "eval_samples_per_second": 22.258, "eval_steps_per_second": 0.739, "step": 13950 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.85, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4341, "max_norm": 43.21664810180664, "max_norm/layer0": 32.8301887512207, "max_norm/layer1": 34.805118560791016, "max_norm/layer10": 36.62165832519531, "max_norm/layer11": 33.37471389770508, "max_norm/layer12": 38.779029846191406, "max_norm/layer13": 33.97347640991211, "max_norm/layer14": 34.97389221191406, "max_norm/layer15": 42.710960388183594, "max_norm/layer16": 35.09590148925781, "max_norm/layer17": 43.21664810180664, "max_norm/layer18": 37.33848571777344, "max_norm/layer19": 36.80155563354492, "max_norm/layer2": 26.006290435791016, "max_norm/layer20": 36.775001525878906, "max_norm/layer21": 37.05457305908203, "max_norm/layer22": 37.47380828857422, "max_norm/layer23": 35.542789459228516, "max_norm/layer3": 33.01007843017578, "max_norm/layer4": 33.06580352783203, "max_norm/layer5": 42.12410354614258, "max_norm/layer6": 27.502948760986328, "max_norm/layer7": 36.20676803588867, "max_norm/layer8": 35.10688781738281, "max_norm/layer9": 35.55755615234375, "mean_norm": 11.6008760035038, "mean_norm/layer0": 11.477870464324951, "mean_norm/layer1": 11.037355363368988, "mean_norm/layer10": 11.354801952838898, "mean_norm/layer11": 11.761891961097717, "mean_norm/layer12": 12.533324897289276, "mean_norm/layer13": 11.388908922672272, "mean_norm/layer14": 11.852356672286987, "mean_norm/layer15": 12.303934931755066, "mean_norm/layer16": 11.456604540348053, "mean_norm/layer17": 12.028372943401337, "mean_norm/layer18": 11.431184530258179, "mean_norm/layer19": 11.509862244129181, "mean_norm/layer2": 9.182381510734558, "mean_norm/layer20": 11.614325940608978, "mean_norm/layer21": 11.582619071006775, "mean_norm/layer22": 12.828144192695618, "mean_norm/layer23": 12.783535063266754, "mean_norm/layer3": 12.311726570129395, "mean_norm/layer4": 10.705096662044525, "mean_norm/layer5": 13.85563451051712, "mean_norm/layer6": 10.06605577468872, "mean_norm/layer7": 10.73960566520691, "mean_norm/layer8": 11.35459178686142, "mean_norm/layer9": 11.26083791255951, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 14000 }, { "epoch": 5.85, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4700478212725569, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.6960055828094482, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8363, "eval_samples_per_second": 20.361, "eval_steps_per_second": 0.676, "step": 14000 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.87, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4387, "max_norm": 43.33818435668945, "max_norm/layer0": 32.90453338623047, "max_norm/layer1": 34.89594650268555, "max_norm/layer10": 36.70533752441406, "max_norm/layer11": 33.45826721191406, "max_norm/layer12": 38.879756927490234, "max_norm/layer13": 34.05232620239258, "max_norm/layer14": 35.064571380615234, "max_norm/layer15": 42.82941436767578, "max_norm/layer16": 35.18965530395508, "max_norm/layer17": 43.33818435668945, "max_norm/layer18": 37.43769073486328, "max_norm/layer19": 36.90222930908203, "max_norm/layer2": 26.053985595703125, "max_norm/layer20": 36.861148834228516, "max_norm/layer21": 37.14982223510742, "max_norm/layer22": 37.572227478027344, "max_norm/layer23": 35.62480545043945, "max_norm/layer3": 33.07106399536133, "max_norm/layer4": 33.13713836669922, "max_norm/layer5": 42.22083282470703, "max_norm/layer6": 27.555927276611328, "max_norm/layer7": 36.295875549316406, "max_norm/layer8": 35.1954345703125, "max_norm/layer9": 35.63373947143555, "mean_norm": 11.610697651902834, "mean_norm/layer0": 11.491089403629303, "mean_norm/layer1": 11.046924233436584, "mean_norm/layer10": 11.363676011562347, "mean_norm/layer11": 11.771858751773834, "mean_norm/layer12": 12.546132445335388, "mean_norm/layer13": 11.398319244384766, "mean_norm/layer14": 11.862588167190552, "mean_norm/layer15": 12.315575361251831, "mean_norm/layer16": 11.465714812278748, "mean_norm/layer17": 12.038424968719482, "mean_norm/layer18": 11.43947297334671, "mean_norm/layer19": 11.518530130386353, "mean_norm/layer2": 9.186090588569641, "mean_norm/layer20": 11.622918426990509, "mean_norm/layer21": 11.591268122196198, "mean_norm/layer22": 12.839798271656036, "mean_norm/layer23": 12.795412421226501, "mean_norm/layer3": 12.324716210365295, "mean_norm/layer4": 10.712847471237183, "mean_norm/layer5": 13.872604966163635, "mean_norm/layer6": 10.071965157985687, "mean_norm/layer7": 10.7472425699234, "mean_norm/layer8": 11.36383306980133, "mean_norm/layer9": 11.269739866256714, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 14050 }, { "epoch": 5.87, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46974767079170776, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.6960787773132324, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6345, "eval_samples_per_second": 20.714, "eval_steps_per_second": 0.688, "step": 14050 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.89, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4431, "max_norm": 43.441749572753906, "max_norm/layer0": 32.974632263183594, "max_norm/layer1": 34.989437103271484, "max_norm/layer10": 36.79485321044922, "max_norm/layer11": 33.53351974487305, "max_norm/layer12": 38.98495864868164, "max_norm/layer13": 34.13669967651367, "max_norm/layer14": 35.149986267089844, "max_norm/layer15": 42.9059944152832, "max_norm/layer16": 35.27094650268555, "max_norm/layer17": 43.441749572753906, "max_norm/layer18": 37.5269775390625, "max_norm/layer19": 36.99470901489258, "max_norm/layer2": 26.092681884765625, "max_norm/layer20": 36.94902038574219, "max_norm/layer21": 37.251434326171875, "max_norm/layer22": 37.671112060546875, "max_norm/layer23": 35.70341873168945, "max_norm/layer3": 33.13298416137695, "max_norm/layer4": 33.20835876464844, "max_norm/layer5": 42.318687438964844, "max_norm/layer6": 27.600130081176758, "max_norm/layer7": 36.378604888916016, "max_norm/layer8": 35.283470153808594, "max_norm/layer9": 35.7142219543457, "mean_norm": 11.620416504641375, "mean_norm/layer0": 11.5041783452034, "mean_norm/layer1": 11.056489646434784, "mean_norm/layer10": 11.372434675693512, "mean_norm/layer11": 11.781669199466705, "mean_norm/layer12": 12.558667540550232, "mean_norm/layer13": 11.407612383365631, "mean_norm/layer14": 11.872676074504852, "mean_norm/layer15": 12.327141106128693, "mean_norm/layer16": 11.474704504013062, "mean_norm/layer17": 12.04838103055954, "mean_norm/layer18": 11.447708785533905, "mean_norm/layer19": 11.527015447616577, "mean_norm/layer2": 9.189803123474121, "mean_norm/layer20": 11.631482064723969, "mean_norm/layer21": 11.599860608577728, "mean_norm/layer22": 12.851312100887299, "mean_norm/layer23": 12.807093441486359, "mean_norm/layer3": 12.337528228759766, "mean_norm/layer4": 10.720510184764862, "mean_norm/layer5": 13.889585733413696, "mean_norm/layer6": 10.077845275402069, "mean_norm/layer7": 10.75475662946701, "mean_norm/layer8": 11.372963190078735, "mean_norm/layer9": 11.278576791286469, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 14100 }, { "epoch": 5.89, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.47030335479003665, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.6899490356445312, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8606, "eval_samples_per_second": 20.319, "eval_steps_per_second": 0.675, "step": 14100 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.91, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4324, "max_norm": 43.548465728759766, "max_norm/layer0": 33.051536560058594, "max_norm/layer1": 35.0789794921875, "max_norm/layer10": 36.88705062866211, "max_norm/layer11": 33.60562515258789, "max_norm/layer12": 39.086647033691406, "max_norm/layer13": 34.211490631103516, "max_norm/layer14": 35.24163818359375, "max_norm/layer15": 43.00029373168945, "max_norm/layer16": 35.36878967285156, "max_norm/layer17": 43.548465728759766, "max_norm/layer18": 37.62931823730469, "max_norm/layer19": 37.08994674682617, "max_norm/layer2": 26.14853858947754, "max_norm/layer20": 37.03773498535156, "max_norm/layer21": 37.34528732299805, "max_norm/layer22": 37.75578308105469, "max_norm/layer23": 35.7780647277832, "max_norm/layer3": 33.202308654785156, "max_norm/layer4": 33.26975631713867, "max_norm/layer5": 42.42267990112305, "max_norm/layer6": 27.656192779541016, "max_norm/layer7": 36.4588508605957, "max_norm/layer8": 35.362754821777344, "max_norm/layer9": 35.800048828125, "mean_norm": 11.630185887217522, "mean_norm/layer0": 11.517368972301483, "mean_norm/layer1": 11.066060483455658, "mean_norm/layer10": 11.381290197372437, "mean_norm/layer11": 11.791641652584076, "mean_norm/layer12": 12.57132887840271, "mean_norm/layer13": 11.416931986808777, "mean_norm/layer14": 11.882811486721039, "mean_norm/layer15": 12.338815450668335, "mean_norm/layer16": 11.483754396438599, "mean_norm/layer17": 12.058379352092743, "mean_norm/layer18": 11.456011533737183, "mean_norm/layer19": 11.535554885864258, "mean_norm/layer2": 9.193414986133575, "mean_norm/layer20": 11.639894902706146, "mean_norm/layer21": 11.608478248119354, "mean_norm/layer22": 12.862938106060028, "mean_norm/layer23": 12.818759024143219, "mean_norm/layer3": 12.350463688373566, "mean_norm/layer4": 10.728277564048767, "mean_norm/layer5": 13.906632900238037, "mean_norm/layer6": 10.083712875843048, "mean_norm/layer7": 10.76239389181137, "mean_norm/layer8": 11.382040023803711, "mean_norm/layer9": 11.287505805492401, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 14150 }, { "epoch": 5.91, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.47015327954961206, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.6898772716522217, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6405, "eval_samples_per_second": 20.704, "eval_steps_per_second": 0.687, "step": 14150 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.93, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4488, "max_norm": 43.65976333618164, "max_norm/layer0": 33.13996124267578, "max_norm/layer1": 35.17390823364258, "max_norm/layer10": 36.97819137573242, "max_norm/layer11": 33.683189392089844, "max_norm/layer12": 39.19681930541992, "max_norm/layer13": 34.28578186035156, "max_norm/layer14": 35.341121673583984, "max_norm/layer15": 43.115135192871094, "max_norm/layer16": 35.4621696472168, "max_norm/layer17": 43.65976333618164, "max_norm/layer18": 37.73054122924805, "max_norm/layer19": 37.18355178833008, "max_norm/layer2": 26.213022232055664, "max_norm/layer20": 37.11777877807617, "max_norm/layer21": 37.44013595581055, "max_norm/layer22": 37.8612060546875, "max_norm/layer23": 35.86772155761719, "max_norm/layer3": 33.270999908447266, "max_norm/layer4": 33.32688903808594, "max_norm/layer5": 42.53396224975586, "max_norm/layer6": 27.718505859375, "max_norm/layer7": 36.53450012207031, "max_norm/layer8": 35.450984954833984, "max_norm/layer9": 35.87091827392578, "mean_norm": 11.639934313793978, "mean_norm/layer0": 11.53043419122696, "mean_norm/layer1": 11.07560282945633, "mean_norm/layer10": 11.390058994293213, "mean_norm/layer11": 11.80152678489685, "mean_norm/layer12": 12.583993315696716, "mean_norm/layer13": 11.426232159137726, "mean_norm/layer14": 11.89290964603424, "mean_norm/layer15": 12.35047596693039, "mean_norm/layer16": 11.492808818817139, "mean_norm/layer17": 12.068269491195679, "mean_norm/layer18": 11.464175939559937, "mean_norm/layer19": 11.544139325618744, "mean_norm/layer2": 9.197042524814606, "mean_norm/layer20": 11.648470103740692, "mean_norm/layer21": 11.617040514945984, "mean_norm/layer22": 12.874555885791779, "mean_norm/layer23": 12.830484867095947, "mean_norm/layer3": 12.363328337669373, "mean_norm/layer4": 10.736116528511047, "mean_norm/layer5": 13.923593997955322, "mean_norm/layer6": 10.089556813240051, "mean_norm/layer7": 10.770008206367493, "mean_norm/layer8": 11.39112776517868, "mean_norm/layer9": 11.296470522880554, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 14200 }, { "epoch": 5.93, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.47055888830751635, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.69054913520813, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8311, "eval_samples_per_second": 20.37, "eval_steps_per_second": 0.676, "step": 14200 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.95, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4344, "max_norm": 43.770164489746094, "max_norm/layer0": 33.20868682861328, "max_norm/layer1": 35.26812744140625, "max_norm/layer10": 37.083702087402344, "max_norm/layer11": 33.75374984741211, "max_norm/layer12": 39.29998779296875, "max_norm/layer13": 34.36618423461914, "max_norm/layer14": 35.43849563598633, "max_norm/layer15": 43.22459411621094, "max_norm/layer16": 35.54741287231445, "max_norm/layer17": 43.770164489746094, "max_norm/layer18": 37.811466217041016, "max_norm/layer19": 37.2822380065918, "max_norm/layer2": 26.2640323638916, "max_norm/layer20": 37.19891357421875, "max_norm/layer21": 37.527061462402344, "max_norm/layer22": 37.950984954833984, "max_norm/layer23": 35.96153259277344, "max_norm/layer3": 33.3438606262207, "max_norm/layer4": 33.387088775634766, "max_norm/layer5": 42.64588165283203, "max_norm/layer6": 27.77462387084961, "max_norm/layer7": 36.612342834472656, "max_norm/layer8": 35.532344818115234, "max_norm/layer9": 35.93207550048828, "mean_norm": 11.649720599253973, "mean_norm/layer0": 11.54356062412262, "mean_norm/layer1": 11.084979772567749, "mean_norm/layer10": 11.398874163627625, "mean_norm/layer11": 11.811476826667786, "mean_norm/layer12": 12.596729159355164, "mean_norm/layer13": 11.4356250166893, "mean_norm/layer14": 11.903102099895477, "mean_norm/layer15": 12.362160086631775, "mean_norm/layer16": 11.501914262771606, "mean_norm/layer17": 12.078312635421753, "mean_norm/layer18": 11.47243356704712, "mean_norm/layer19": 11.55273050069809, "mean_norm/layer2": 9.200705409049988, "mean_norm/layer20": 11.65684986114502, "mean_norm/layer21": 11.6256822347641, "mean_norm/layer22": 12.886271953582764, "mean_norm/layer23": 12.842396259307861, "mean_norm/layer3": 12.376322150230408, "mean_norm/layer4": 10.743931829929352, "mean_norm/layer5": 13.940525889396667, "mean_norm/layer6": 10.095376551151276, "mean_norm/layer7": 10.777623057365417, "mean_norm/layer8": 11.400293707847595, "mean_norm/layer9": 11.305416762828827, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 14250 }, { "epoch": 5.95, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4709604409778416, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.693927764892578, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8382, "eval_samples_per_second": 20.358, "eval_steps_per_second": 0.676, "step": 14250 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.97, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4414, "max_norm": 43.877471923828125, "max_norm/layer0": 33.2783317565918, "max_norm/layer1": 35.36090850830078, "max_norm/layer10": 37.202369689941406, "max_norm/layer11": 33.82597351074219, "max_norm/layer12": 39.39459991455078, "max_norm/layer13": 34.450408935546875, "max_norm/layer14": 35.524879455566406, "max_norm/layer15": 43.33192825317383, "max_norm/layer16": 35.63564682006836, "max_norm/layer17": 43.877471923828125, "max_norm/layer18": 37.90175247192383, "max_norm/layer19": 37.37932586669922, "max_norm/layer2": 26.314382553100586, "max_norm/layer20": 37.288143157958984, "max_norm/layer21": 37.59833526611328, "max_norm/layer22": 38.0389289855957, "max_norm/layer23": 36.04848098754883, "max_norm/layer3": 33.40947723388672, "max_norm/layer4": 33.448463439941406, "max_norm/layer5": 42.75556182861328, "max_norm/layer6": 27.835750579833984, "max_norm/layer7": 36.69871139526367, "max_norm/layer8": 35.61986541748047, "max_norm/layer9": 35.991172790527344, "mean_norm": 11.65939316401879, "mean_norm/layer0": 11.556526839733124, "mean_norm/layer1": 11.094407200813293, "mean_norm/layer10": 11.407621800899506, "mean_norm/layer11": 11.821186006069183, "mean_norm/layer12": 12.609242022037506, "mean_norm/layer13": 11.444914400577545, "mean_norm/layer14": 11.913126409053802, "mean_norm/layer15": 12.373706638813019, "mean_norm/layer16": 11.510907769203186, "mean_norm/layer17": 12.088223099708557, "mean_norm/layer18": 11.480640769004822, "mean_norm/layer19": 11.561327338218689, "mean_norm/layer2": 9.204297006130219, "mean_norm/layer20": 11.66532027721405, "mean_norm/layer21": 11.63420432806015, "mean_norm/layer22": 12.89782601594925, "mean_norm/layer23": 12.85407680273056, "mean_norm/layer3": 12.389108657836914, "mean_norm/layer4": 10.751596450805664, "mean_norm/layer5": 13.9572993516922, "mean_norm/layer6": 10.101068377494812, "mean_norm/layer7": 10.785195469856262, "mean_norm/layer8": 11.409336149692535, "mean_norm/layer9": 11.31427675485611, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 14300 }, { "epoch": 5.97, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.471937958084391, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.687013626098633, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6223, "eval_samples_per_second": 20.736, "eval_steps_per_second": 0.688, "step": 14300 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 5.99, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.4437, "max_norm": 43.989898681640625, "max_norm/layer0": 33.34931564331055, "max_norm/layer1": 35.46033477783203, "max_norm/layer10": 37.316829681396484, "max_norm/layer11": 33.88945007324219, "max_norm/layer12": 39.5078125, "max_norm/layer13": 34.53520965576172, "max_norm/layer14": 35.60698699951172, "max_norm/layer15": 43.46208953857422, "max_norm/layer16": 35.72053527832031, "max_norm/layer17": 43.989898681640625, "max_norm/layer18": 37.99073028564453, "max_norm/layer19": 37.48189163208008, "max_norm/layer2": 26.361745834350586, "max_norm/layer20": 37.369483947753906, "max_norm/layer21": 37.68265151977539, "max_norm/layer22": 38.128868103027344, "max_norm/layer23": 36.1319465637207, "max_norm/layer3": 33.48076248168945, "max_norm/layer4": 33.50715255737305, "max_norm/layer5": 42.86227035522461, "max_norm/layer6": 27.901187896728516, "max_norm/layer7": 36.785762786865234, "max_norm/layer8": 35.692440032958984, "max_norm/layer9": 36.05787658691406, "mean_norm": 11.669073348244032, "mean_norm/layer0": 11.569561958312988, "mean_norm/layer1": 11.103819906711578, "mean_norm/layer10": 11.41639906167984, "mean_norm/layer11": 11.830869317054749, "mean_norm/layer12": 12.621800243854523, "mean_norm/layer13": 11.454206645488739, "mean_norm/layer14": 11.923109650611877, "mean_norm/layer15": 12.385221660137177, "mean_norm/layer16": 11.519890904426575, "mean_norm/layer17": 12.098167896270752, "mean_norm/layer18": 11.488867819309235, "mean_norm/layer19": 11.569864094257355, "mean_norm/layer2": 9.207905173301697, "mean_norm/layer20": 11.673797130584717, "mean_norm/layer21": 11.642704725265503, "mean_norm/layer22": 12.909379720687866, "mean_norm/layer23": 12.865759074687958, "mean_norm/layer3": 12.401918411254883, "mean_norm/layer4": 10.759348154067993, "mean_norm/layer5": 13.974067091941833, "mean_norm/layer6": 10.10683810710907, "mean_norm/layer7": 10.79275369644165, "mean_norm/layer8": 11.41837626695633, "mean_norm/layer9": 11.323133647441864, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 14350 }, { "epoch": 5.99, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4716945928296484, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.6884405612945557, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8294, "eval_samples_per_second": 20.373, "eval_steps_per_second": 0.676, "step": 14350 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 6.01, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.3129, "max_norm": 44.09721374511719, "max_norm/layer0": 33.424678802490234, "max_norm/layer1": 35.5435676574707, "max_norm/layer10": 37.4267578125, "max_norm/layer11": 33.97317123413086, "max_norm/layer12": 39.60700225830078, "max_norm/layer13": 34.626312255859375, "max_norm/layer14": 35.68148422241211, "max_norm/layer15": 43.590301513671875, "max_norm/layer16": 35.797027587890625, "max_norm/layer17": 44.09721374511719, "max_norm/layer18": 38.072628021240234, "max_norm/layer19": 37.573429107666016, "max_norm/layer2": 26.40358543395996, "max_norm/layer20": 37.452476501464844, "max_norm/layer21": 37.774017333984375, "max_norm/layer22": 38.23457717895508, "max_norm/layer23": 36.20406723022461, "max_norm/layer3": 33.54252243041992, "max_norm/layer4": 33.57847213745117, "max_norm/layer5": 42.95096969604492, "max_norm/layer6": 27.952163696289062, "max_norm/layer7": 36.872596740722656, "max_norm/layer8": 35.75625228881836, "max_norm/layer9": 36.12723922729492, "mean_norm": 11.678674280643463, "mean_norm/layer0": 11.582400023937225, "mean_norm/layer1": 11.113045513629913, "mean_norm/layer10": 11.425013542175293, "mean_norm/layer11": 11.840567767620087, "mean_norm/layer12": 12.634274005889893, "mean_norm/layer13": 11.463509678840637, "mean_norm/layer14": 11.933098912239075, "mean_norm/layer15": 12.396642088890076, "mean_norm/layer16": 11.528850138187408, "mean_norm/layer17": 12.10803872346878, "mean_norm/layer18": 11.497036457061768, "mean_norm/layer19": 11.578483283519745, "mean_norm/layer2": 9.21142292022705, "mean_norm/layer20": 11.682356297969818, "mean_norm/layer21": 11.651371657848358, "mean_norm/layer22": 12.920911967754364, "mean_norm/layer23": 12.877335011959076, "mean_norm/layer3": 12.414536356925964, "mean_norm/layer4": 10.766944766044617, "mean_norm/layer5": 13.990516602993011, "mean_norm/layer6": 10.112547993659973, "mean_norm/layer7": 10.800214946269989, "mean_norm/layer8": 11.427287995815277, "mean_norm/layer9": 11.331776082515717, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 14400 }, { "epoch": 6.01, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46913520156727223, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7376086711883545, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6168, "eval_samples_per_second": 20.746, "eval_steps_per_second": 0.689, "step": 14400 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 6.03, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.2464, "max_norm": 44.224796295166016, "max_norm/layer0": 33.49764633178711, "max_norm/layer1": 35.63376235961914, "max_norm/layer10": 37.52918243408203, "max_norm/layer11": 34.06564712524414, "max_norm/layer12": 39.712989807128906, "max_norm/layer13": 34.71847915649414, "max_norm/layer14": 35.767826080322266, "max_norm/layer15": 43.719058990478516, "max_norm/layer16": 35.88226318359375, "max_norm/layer17": 44.224796295166016, "max_norm/layer18": 38.1541633605957, "max_norm/layer19": 37.67153549194336, "max_norm/layer2": 26.451637268066406, "max_norm/layer20": 37.53163528442383, "max_norm/layer21": 37.86661148071289, "max_norm/layer22": 38.343509674072266, "max_norm/layer23": 36.274871826171875, "max_norm/layer3": 33.602134704589844, "max_norm/layer4": 33.64577102661133, "max_norm/layer5": 43.04342269897461, "max_norm/layer6": 28.01210594177246, "max_norm/layer7": 36.95952606201172, "max_norm/layer8": 35.837249755859375, "max_norm/layer9": 36.20220947265625, "mean_norm": 11.688791334629059, "mean_norm/layer0": 11.596086919307709, "mean_norm/layer1": 11.122628390789032, "mean_norm/layer10": 11.433982729911804, "mean_norm/layer11": 11.85074108839035, "mean_norm/layer12": 12.647378921508789, "mean_norm/layer13": 11.473222136497498, "mean_norm/layer14": 11.943670928478241, "mean_norm/layer15": 12.408711671829224, "mean_norm/layer16": 11.538374602794647, "mean_norm/layer17": 12.11855924129486, "mean_norm/layer18": 11.505737960338593, "mean_norm/layer19": 11.587811827659607, "mean_norm/layer2": 9.215099394321442, "mean_norm/layer20": 11.691645443439484, "mean_norm/layer21": 11.660697937011719, "mean_norm/layer22": 12.93289566040039, "mean_norm/layer23": 12.889711081981659, "mean_norm/layer3": 12.427682518959045, "mean_norm/layer4": 10.774953126907349, "mean_norm/layer5": 14.00755500793457, "mean_norm/layer6": 10.118492186069489, "mean_norm/layer7": 10.80799287557602, "mean_norm/layer8": 11.436597108840942, "mean_norm/layer9": 11.34076327085495, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 14450 }, { "epoch": 6.03, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46790215094324317, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.740433931350708, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8406, "eval_samples_per_second": 20.354, "eval_steps_per_second": 0.676, "step": 14450 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 6.05, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.2476, "max_norm": 44.33781433105469, "max_norm/layer0": 33.578407287597656, "max_norm/layer1": 35.71784591674805, "max_norm/layer10": 37.634239196777344, "max_norm/layer11": 34.15476989746094, "max_norm/layer12": 39.832733154296875, "max_norm/layer13": 34.81980895996094, "max_norm/layer14": 35.85801315307617, "max_norm/layer15": 43.835697174072266, "max_norm/layer16": 35.963539123535156, "max_norm/layer17": 44.33781433105469, "max_norm/layer18": 38.23371505737305, "max_norm/layer19": 37.796539306640625, "max_norm/layer2": 26.483850479125977, "max_norm/layer20": 37.608795166015625, "max_norm/layer21": 37.96210479736328, "max_norm/layer22": 38.45704650878906, "max_norm/layer23": 36.3537483215332, "max_norm/layer3": 33.67289352416992, "max_norm/layer4": 33.70362091064453, "max_norm/layer5": 43.14081954956055, "max_norm/layer6": 28.07660675048828, "max_norm/layer7": 37.03910827636719, "max_norm/layer8": 35.92915344238281, "max_norm/layer9": 36.28647994995117, "mean_norm": 11.698854426542917, "mean_norm/layer0": 11.610015153884888, "mean_norm/layer1": 11.13212662935257, "mean_norm/layer10": 11.442975342273712, "mean_norm/layer11": 11.860947608947754, "mean_norm/layer12": 12.660435795783997, "mean_norm/layer13": 11.48287183046341, "mean_norm/layer14": 11.95419842004776, "mean_norm/layer15": 12.420693695545197, "mean_norm/layer16": 11.547771215438843, "mean_norm/layer17": 12.128973543643951, "mean_norm/layer18": 11.514398634433746, "mean_norm/layer19": 11.597030580043793, "mean_norm/layer2": 9.21879118680954, "mean_norm/layer20": 11.70077121257782, "mean_norm/layer21": 11.669915497303009, "mean_norm/layer22": 12.944676518440247, "mean_norm/layer23": 12.901835203170776, "mean_norm/layer3": 12.440813302993774, "mean_norm/layer4": 10.78300029039383, "mean_norm/layer5": 14.02452540397644, "mean_norm/layer6": 10.124517142772675, "mean_norm/layer7": 10.815687239170074, "mean_norm/layer8": 11.445838451385498, "mean_norm/layer9": 11.349696338176727, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 14500 }, { "epoch": 6.05, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46863630279505, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7320709228515625, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8508, "eval_samples_per_second": 20.336, "eval_steps_per_second": 0.675, "step": 14500 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 6.08, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.2637, "max_norm": 44.466896057128906, "max_norm/layer0": 33.65315246582031, "max_norm/layer1": 35.79899597167969, "max_norm/layer10": 37.72567367553711, "max_norm/layer11": 34.24459457397461, "max_norm/layer12": 39.92678451538086, "max_norm/layer13": 34.91712188720703, "max_norm/layer14": 35.933841705322266, "max_norm/layer15": 43.96389389038086, "max_norm/layer16": 36.0675163269043, "max_norm/layer17": 44.466896057128906, "max_norm/layer18": 38.311832427978516, "max_norm/layer19": 37.89857864379883, "max_norm/layer2": 26.51372528076172, "max_norm/layer20": 37.69976806640625, "max_norm/layer21": 38.0622673034668, "max_norm/layer22": 38.56037521362305, "max_norm/layer23": 36.4434928894043, "max_norm/layer3": 33.747703552246094, "max_norm/layer4": 33.77354049682617, "max_norm/layer5": 43.23781204223633, "max_norm/layer6": 28.13241958618164, "max_norm/layer7": 37.13059997558594, "max_norm/layer8": 36.016422271728516, "max_norm/layer9": 36.36855697631836, "mean_norm": 11.708862346907457, "mean_norm/layer0": 11.624148964881897, "mean_norm/layer1": 11.141570508480072, "mean_norm/layer10": 11.451896965503693, "mean_norm/layer11": 11.871017575263977, "mean_norm/layer12": 12.673356175422668, "mean_norm/layer13": 11.492523610591888, "mean_norm/layer14": 11.964637100696564, "mean_norm/layer15": 12.432619631290436, "mean_norm/layer16": 11.557033240795135, "mean_norm/layer17": 12.139299035072327, "mean_norm/layer18": 11.52294272184372, "mean_norm/layer19": 11.606126606464386, "mean_norm/layer2": 9.222389996051788, "mean_norm/layer20": 11.709802210330963, "mean_norm/layer21": 11.679030537605286, "mean_norm/layer22": 12.956490218639374, "mean_norm/layer23": 12.913890182971954, "mean_norm/layer3": 12.453877091407776, "mean_norm/layer4": 10.790977239608765, "mean_norm/layer5": 14.041500270366669, "mean_norm/layer6": 10.130520582199097, "mean_norm/layer7": 10.823352634906769, "mean_norm/layer8": 11.455033659934998, "mean_norm/layer9": 11.358659565448761, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 14550 }, { "epoch": 6.08, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46778858049102995, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7400739192962646, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6327, "eval_samples_per_second": 20.717, "eval_steps_per_second": 0.688, "step": 14550 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 6.1, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.2673, "max_norm": 44.583953857421875, "max_norm/layer0": 33.732749938964844, "max_norm/layer1": 35.883670806884766, "max_norm/layer10": 37.817840576171875, "max_norm/layer11": 34.32735824584961, "max_norm/layer12": 40.04595184326172, "max_norm/layer13": 35.021026611328125, "max_norm/layer14": 36.01658630371094, "max_norm/layer15": 44.089717864990234, "max_norm/layer16": 36.161041259765625, "max_norm/layer17": 44.583953857421875, "max_norm/layer18": 38.40084457397461, "max_norm/layer19": 37.9990234375, "max_norm/layer2": 26.546798706054688, "max_norm/layer20": 37.787086486816406, "max_norm/layer21": 38.14870071411133, "max_norm/layer22": 38.677337646484375, "max_norm/layer23": 36.53557205200195, "max_norm/layer3": 33.816959381103516, "max_norm/layer4": 33.839500427246094, "max_norm/layer5": 43.33034133911133, "max_norm/layer6": 28.18335723876953, "max_norm/layer7": 37.20534896850586, "max_norm/layer8": 36.09880065917969, "max_norm/layer9": 36.45109939575195, "mean_norm": 11.718958477179209, "mean_norm/layer0": 11.638537287712097, "mean_norm/layer1": 11.151164829730988, "mean_norm/layer10": 11.460838198661804, "mean_norm/layer11": 11.881148874759674, "mean_norm/layer12": 12.686423182487488, "mean_norm/layer13": 11.502274334430695, "mean_norm/layer14": 11.975151538848877, "mean_norm/layer15": 12.444611430168152, "mean_norm/layer16": 11.566363215446472, "mean_norm/layer17": 12.149612188339233, "mean_norm/layer18": 11.531615495681763, "mean_norm/layer19": 11.615218698978424, "mean_norm/layer2": 9.226134121418, "mean_norm/layer20": 11.718867301940918, "mean_norm/layer21": 11.688138842582703, "mean_norm/layer22": 12.968413412570953, "mean_norm/layer23": 12.926041781902313, "mean_norm/layer3": 12.467107772827148, "mean_norm/layer4": 10.79892909526825, "mean_norm/layer5": 14.058703899383545, "mean_norm/layer6": 10.13658756017685, "mean_norm/layer7": 10.831100225448608, "mean_norm/layer8": 11.464323878288269, "mean_norm/layer9": 11.367696285247803, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 14600 }, { "epoch": 6.1, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4664500715899458, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7531161308288574, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6421, "eval_samples_per_second": 20.701, "eval_steps_per_second": 0.687, "step": 14600 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 6.12, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.2826, "max_norm": 44.69528579711914, "max_norm/layer0": 33.810848236083984, "max_norm/layer1": 35.97419357299805, "max_norm/layer10": 37.910186767578125, "max_norm/layer11": 34.40093994140625, "max_norm/layer12": 40.16526412963867, "max_norm/layer13": 35.1344108581543, "max_norm/layer14": 36.102210998535156, "max_norm/layer15": 44.21253967285156, "max_norm/layer16": 36.24266815185547, "max_norm/layer17": 44.69528579711914, "max_norm/layer18": 38.483097076416016, "max_norm/layer19": 38.10674285888672, "max_norm/layer2": 26.580692291259766, "max_norm/layer20": 37.87656021118164, "max_norm/layer21": 38.24087905883789, "max_norm/layer22": 38.77226257324219, "max_norm/layer23": 36.63397979736328, "max_norm/layer3": 33.88368225097656, "max_norm/layer4": 33.91764831542969, "max_norm/layer5": 43.41983413696289, "max_norm/layer6": 28.235586166381836, "max_norm/layer7": 37.27918243408203, "max_norm/layer8": 36.18343734741211, "max_norm/layer9": 36.5324821472168, "mean_norm": 11.72901346286138, "mean_norm/layer0": 11.652945280075073, "mean_norm/layer1": 11.160664916038513, "mean_norm/layer10": 11.469777524471283, "mean_norm/layer11": 11.891315817832947, "mean_norm/layer12": 12.6994588971138, "mean_norm/layer13": 11.511991381645203, "mean_norm/layer14": 11.985653817653656, "mean_norm/layer15": 12.45661973953247, "mean_norm/layer16": 11.575735986232758, "mean_norm/layer17": 12.159762263298035, "mean_norm/layer18": 11.540223777294159, "mean_norm/layer19": 11.624176979064941, "mean_norm/layer2": 9.229885399341583, "mean_norm/layer20": 11.727642595767975, "mean_norm/layer21": 11.697233855724335, "mean_norm/layer22": 12.980267107486725, "mean_norm/layer23": 12.938136041164398, "mean_norm/layer3": 12.480332374572754, "mean_norm/layer4": 10.80697101354599, "mean_norm/layer5": 14.075869083404541, "mean_norm/layer6": 10.142605304718018, "mean_norm/layer7": 10.838842630386353, "mean_norm/layer8": 11.4734987616539, "mean_norm/layer9": 11.376712560653687, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 14650 }, { "epoch": 6.12, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4675654956741826, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7478952407836914, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6343, "eval_samples_per_second": 20.715, "eval_steps_per_second": 0.688, "step": 14650 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 6.14, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.2803, "max_norm": 44.81999969482422, "max_norm/layer0": 33.90229415893555, "max_norm/layer1": 36.06707000732422, "max_norm/layer10": 38.000553131103516, "max_norm/layer11": 34.46437072753906, "max_norm/layer12": 40.27119445800781, "max_norm/layer13": 35.24424362182617, "max_norm/layer14": 36.18069076538086, "max_norm/layer15": 44.345882415771484, "max_norm/layer16": 36.323299407958984, "max_norm/layer17": 44.81999969482422, "max_norm/layer18": 38.57911682128906, "max_norm/layer19": 38.21243667602539, "max_norm/layer2": 26.61791229248047, "max_norm/layer20": 37.95322036743164, "max_norm/layer21": 38.327857971191406, "max_norm/layer22": 38.86759948730469, "max_norm/layer23": 36.73441696166992, "max_norm/layer3": 33.94342041015625, "max_norm/layer4": 33.98491668701172, "max_norm/layer5": 43.51378631591797, "max_norm/layer6": 28.28629493713379, "max_norm/layer7": 37.365936279296875, "max_norm/layer8": 36.26069641113281, "max_norm/layer9": 36.62409210205078, "mean_norm": 11.73909062643846, "mean_norm/layer0": 11.667441129684448, "mean_norm/layer1": 11.170315623283386, "mean_norm/layer10": 11.478734910488129, "mean_norm/layer11": 11.901362717151642, "mean_norm/layer12": 12.712479770183563, "mean_norm/layer13": 11.521682798862457, "mean_norm/layer14": 11.996141493320465, "mean_norm/layer15": 12.4685178399086, "mean_norm/layer16": 11.585081934928894, "mean_norm/layer17": 12.170037686824799, "mean_norm/layer18": 11.548860013484955, "mean_norm/layer19": 11.633151412010193, "mean_norm/layer2": 9.233680367469788, "mean_norm/layer20": 11.736494660377502, "mean_norm/layer21": 11.706235766410828, "mean_norm/layer22": 12.99212795495987, "mean_norm/layer23": 12.950253963470459, "mean_norm/layer3": 12.49367219209671, "mean_norm/layer4": 10.815063416957855, "mean_norm/layer5": 14.093105018138885, "mean_norm/layer6": 10.148611605167389, "mean_norm/layer7": 10.846603572368622, "mean_norm/layer8": 11.482750594615936, "mean_norm/layer9": 11.385768592357635, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 14700 }, { "epoch": 6.14, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4669651947124842, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.744550943374634, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8594, "eval_samples_per_second": 20.321, "eval_steps_per_second": 0.675, "step": 14700 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 6.16, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.2888, "max_norm": 44.948341369628906, "max_norm/layer0": 33.99632263183594, "max_norm/layer1": 36.15312957763672, "max_norm/layer10": 38.092010498046875, "max_norm/layer11": 34.52595901489258, "max_norm/layer12": 40.37563705444336, "max_norm/layer13": 35.3314094543457, "max_norm/layer14": 36.26191711425781, "max_norm/layer15": 44.47978973388672, "max_norm/layer16": 36.41969299316406, "max_norm/layer17": 44.948341369628906, "max_norm/layer18": 38.67579650878906, "max_norm/layer19": 38.30149841308594, "max_norm/layer2": 26.659557342529297, "max_norm/layer20": 38.041748046875, "max_norm/layer21": 38.415489196777344, "max_norm/layer22": 38.947418212890625, "max_norm/layer23": 36.82078552246094, "max_norm/layer3": 34.01167678833008, "max_norm/layer4": 34.06661605834961, "max_norm/layer5": 43.61132049560547, "max_norm/layer6": 28.341476440429688, "max_norm/layer7": 37.45941925048828, "max_norm/layer8": 36.348426818847656, "max_norm/layer9": 36.70441436767578, "mean_norm": 11.749220199882984, "mean_norm/layer0": 11.682098507881165, "mean_norm/layer1": 11.180002629756927, "mean_norm/layer10": 11.487772464752197, "mean_norm/layer11": 11.911587059497833, "mean_norm/layer12": 12.725587904453278, "mean_norm/layer13": 11.531331658363342, "mean_norm/layer14": 12.006726801395416, "mean_norm/layer15": 12.48053240776062, "mean_norm/layer16": 11.594469606876373, "mean_norm/layer17": 12.180344343185425, "mean_norm/layer18": 11.557434797286987, "mean_norm/layer19": 11.642093479633331, "mean_norm/layer2": 9.237485826015472, "mean_norm/layer20": 11.745355069637299, "mean_norm/layer21": 11.715200185775757, "mean_norm/layer22": 13.004086434841156, "mean_norm/layer23": 12.962449193000793, "mean_norm/layer3": 12.507059156894684, "mean_norm/layer4": 10.823196411132812, "mean_norm/layer5": 14.110482037067413, "mean_norm/layer6": 10.154706180095673, "mean_norm/layer7": 10.854439437389374, "mean_norm/layer8": 11.492040276527405, "mean_norm/layer9": 11.394802927970886, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 14750 }, { "epoch": 6.16, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.4657443123511923, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.750763416290283, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.67, "eval_samples_per_second": 20.651, "eval_steps_per_second": 0.686, "step": 14750 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 6.18, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.303, "max_norm": 45.073246002197266, "max_norm/layer0": 34.08710861206055, "max_norm/layer1": 36.244224548339844, "max_norm/layer10": 38.180023193359375, "max_norm/layer11": 34.58510971069336, "max_norm/layer12": 40.496421813964844, "max_norm/layer13": 35.42164993286133, "max_norm/layer14": 36.34925079345703, "max_norm/layer15": 44.600223541259766, "max_norm/layer16": 36.52353286743164, "max_norm/layer17": 45.073246002197266, "max_norm/layer18": 38.772789001464844, "max_norm/layer19": 38.385990142822266, "max_norm/layer2": 26.702438354492188, "max_norm/layer20": 38.13774871826172, "max_norm/layer21": 38.51622009277344, "max_norm/layer22": 39.0334358215332, "max_norm/layer23": 36.904296875, "max_norm/layer3": 34.07844543457031, "max_norm/layer4": 34.143314361572266, "max_norm/layer5": 43.70988845825195, "max_norm/layer6": 28.39101219177246, "max_norm/layer7": 37.5562629699707, "max_norm/layer8": 36.42280578613281, "max_norm/layer9": 36.77370071411133, "mean_norm": 11.759335647026697, "mean_norm/layer0": 11.696792960166931, "mean_norm/layer1": 11.189741432666779, "mean_norm/layer10": 11.496793627738953, "mean_norm/layer11": 11.921910107135773, "mean_norm/layer12": 12.73866891860962, "mean_norm/layer13": 11.541031777858734, "mean_norm/layer14": 12.017287492752075, "mean_norm/layer15": 12.492536306381226, "mean_norm/layer16": 11.603844463825226, "mean_norm/layer17": 12.190562188625336, "mean_norm/layer18": 11.566004931926727, "mean_norm/layer19": 11.651012122631073, "mean_norm/layer2": 9.241271734237671, "mean_norm/layer20": 11.754229307174683, "mean_norm/layer21": 11.724102795124054, "mean_norm/layer22": 13.015969455242157, "mean_norm/layer23": 12.974500477313995, "mean_norm/layer3": 12.520442187786102, "mean_norm/layer4": 10.831291019916534, "mean_norm/layer5": 14.127792298793793, "mean_norm/layer6": 10.160741567611694, "mean_norm/layer7": 10.862253546714783, "mean_norm/layer8": 11.501340448856354, "mean_norm/layer9": 11.403934359550476, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 14800 }, { "epoch": 6.18, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46723289649270106, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.738095283508301, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6524, "eval_samples_per_second": 20.683, "eval_steps_per_second": 0.687, "step": 14800 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 6.2, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.3071, "max_norm": 45.186065673828125, "max_norm/layer0": 34.180145263671875, "max_norm/layer1": 36.340614318847656, "max_norm/layer10": 38.263370513916016, "max_norm/layer11": 34.65528106689453, "max_norm/layer12": 40.61335754394531, "max_norm/layer13": 35.51411437988281, "max_norm/layer14": 36.4224739074707, "max_norm/layer15": 44.72835159301758, "max_norm/layer16": 36.632625579833984, "max_norm/layer17": 45.186065673828125, "max_norm/layer18": 38.86900329589844, "max_norm/layer19": 38.483543395996094, "max_norm/layer2": 26.746105194091797, "max_norm/layer20": 38.22907638549805, "max_norm/layer21": 38.60087203979492, "max_norm/layer22": 39.13743591308594, "max_norm/layer23": 36.99153518676758, "max_norm/layer3": 34.13496017456055, "max_norm/layer4": 34.21876525878906, "max_norm/layer5": 43.80707931518555, "max_norm/layer6": 28.444496154785156, "max_norm/layer7": 37.6572380065918, "max_norm/layer8": 36.48862075805664, "max_norm/layer9": 36.847434997558594, "mean_norm": 11.769410625100136, "mean_norm/layer0": 11.71136349439621, "mean_norm/layer1": 11.19951182603836, "mean_norm/layer10": 11.505762279033661, "mean_norm/layer11": 11.932011187076569, "mean_norm/layer12": 12.751639366149902, "mean_norm/layer13": 11.550610899925232, "mean_norm/layer14": 12.027763426303864, "mean_norm/layer15": 12.504477262496948, "mean_norm/layer16": 11.613188326358795, "mean_norm/layer17": 12.20076310634613, "mean_norm/layer18": 11.574527025222778, "mean_norm/layer19": 11.660000503063202, "mean_norm/layer2": 9.245114207267761, "mean_norm/layer20": 11.763050854206085, "mean_norm/layer21": 11.733014643192291, "mean_norm/layer22": 13.027836441993713, "mean_norm/layer23": 12.986533343791962, "mean_norm/layer3": 12.533765077590942, "mean_norm/layer4": 10.839352071285248, "mean_norm/layer5": 14.145084381103516, "mean_norm/layer6": 10.166761040687561, "mean_norm/layer7": 10.870099246501923, "mean_norm/layer8": 11.51064658164978, "mean_norm/layer9": 11.412978410720825, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 14850 }, { "epoch": 6.2, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46671371728258354, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7497682571411133, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 10.8261, "eval_samples_per_second": 22.261, "eval_steps_per_second": 0.739, "step": 14850 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 6.22, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.3014, "max_norm": 45.308223724365234, "max_norm/layer0": 34.267417907714844, "max_norm/layer1": 36.43744659423828, "max_norm/layer10": 38.35849380493164, "max_norm/layer11": 34.72025680541992, "max_norm/layer12": 40.71356201171875, "max_norm/layer13": 35.608646392822266, "max_norm/layer14": 36.5001220703125, "max_norm/layer15": 44.83946228027344, "max_norm/layer16": 36.73179244995117, "max_norm/layer17": 45.308223724365234, "max_norm/layer18": 38.9741325378418, "max_norm/layer19": 38.586544036865234, "max_norm/layer2": 26.78317642211914, "max_norm/layer20": 38.316619873046875, "max_norm/layer21": 38.68571853637695, "max_norm/layer22": 39.225032806396484, "max_norm/layer23": 37.06938171386719, "max_norm/layer3": 34.203548431396484, "max_norm/layer4": 34.2883415222168, "max_norm/layer5": 43.896480560302734, "max_norm/layer6": 28.498565673828125, "max_norm/layer7": 37.7492790222168, "max_norm/layer8": 36.55672073364258, "max_norm/layer9": 36.92335891723633, "mean_norm": 11.779515077670416, "mean_norm/layer0": 11.726049065589905, "mean_norm/layer1": 11.209324061870575, "mean_norm/layer10": 11.514764368534088, "mean_norm/layer11": 11.942122519016266, "mean_norm/layer12": 12.764708518981934, "mean_norm/layer13": 11.560275077819824, "mean_norm/layer14": 12.038271605968475, "mean_norm/layer15": 12.51647001504898, "mean_norm/layer16": 11.622543811798096, "mean_norm/layer17": 12.210929572582245, "mean_norm/layer18": 11.583010852336884, "mean_norm/layer19": 11.668940365314484, "mean_norm/layer2": 9.248961925506592, "mean_norm/layer20": 11.771803140640259, "mean_norm/layer21": 11.74181979894638, "mean_norm/layer22": 13.039653956890106, "mean_norm/layer23": 12.998541593551636, "mean_norm/layer3": 12.547242283821106, "mean_norm/layer4": 10.84747463464737, "mean_norm/layer5": 14.16251653432846, "mean_norm/layer6": 10.172904789447784, "mean_norm/layer7": 10.877913773059845, "mean_norm/layer8": 11.520046174526215, "mean_norm/layer9": 11.422073423862457, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 14900 }, { "epoch": 6.22, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46574025626361326, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.743490219116211, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.8386, "eval_samples_per_second": 20.357, "eval_steps_per_second": 0.676, "step": 14900 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 6.24, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.3088, "max_norm": 45.41685104370117, "max_norm/layer0": 34.35284423828125, "max_norm/layer1": 36.526798248291016, "max_norm/layer10": 38.4525146484375, "max_norm/layer11": 34.7932243347168, "max_norm/layer12": 40.7994499206543, "max_norm/layer13": 35.694664001464844, "max_norm/layer14": 36.587955474853516, "max_norm/layer15": 44.962310791015625, "max_norm/layer16": 36.83222198486328, "max_norm/layer17": 45.41685104370117, "max_norm/layer18": 39.11237335205078, "max_norm/layer19": 38.691707611083984, "max_norm/layer2": 26.809534072875977, "max_norm/layer20": 38.412635803222656, "max_norm/layer21": 38.78028869628906, "max_norm/layer22": 39.322757720947266, "max_norm/layer23": 37.13923263549805, "max_norm/layer3": 34.273311614990234, "max_norm/layer4": 34.368839263916016, "max_norm/layer5": 43.9959716796875, "max_norm/layer6": 28.55388832092285, "max_norm/layer7": 37.8399658203125, "max_norm/layer8": 36.626319885253906, "max_norm/layer9": 36.991241455078125, "mean_norm": 11.789648773769537, "mean_norm/layer0": 11.740796387195587, "mean_norm/layer1": 11.219213783740997, "mean_norm/layer10": 11.523796737194061, "mean_norm/layer11": 11.952241718769073, "mean_norm/layer12": 12.777762591838837, "mean_norm/layer13": 11.569939851760864, "mean_norm/layer14": 12.048766016960144, "mean_norm/layer15": 12.528478980064392, "mean_norm/layer16": 11.63189560174942, "mean_norm/layer17": 12.221157014369965, "mean_norm/layer18": 11.591578304767609, "mean_norm/layer19": 11.6779265999794, "mean_norm/layer2": 9.252777576446533, "mean_norm/layer20": 11.780601918697357, "mean_norm/layer21": 11.750674307346344, "mean_norm/layer22": 13.051563382148743, "mean_norm/layer23": 13.010630786418915, "mean_norm/layer3": 12.56077265739441, "mean_norm/layer4": 10.855627298355103, "mean_norm/layer5": 14.179958462715149, "mean_norm/layer6": 10.179086148738861, "mean_norm/layer7": 10.885732650756836, "mean_norm/layer8": 11.529394507408142, "mean_norm/layer9": 11.43119728565216, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 14950 }, { "epoch": 6.24, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46645818376510384, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7555625438690186, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6207, "eval_samples_per_second": 20.739, "eval_steps_per_second": 0.688, "step": 14950 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 6.26, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "learning_rate": 0.0005, "loss": 2.3235, "max_norm": 45.539119720458984, "max_norm/layer0": 34.44173049926758, "max_norm/layer1": 36.61558151245117, "max_norm/layer10": 38.54380416870117, "max_norm/layer11": 34.865203857421875, "max_norm/layer12": 40.908504486083984, "max_norm/layer13": 35.78108215332031, "max_norm/layer14": 36.67228317260742, "max_norm/layer15": 45.083438873291016, "max_norm/layer16": 36.927913665771484, "max_norm/layer17": 45.539119720458984, "max_norm/layer18": 39.2352409362793, "max_norm/layer19": 38.779598236083984, "max_norm/layer2": 26.836795806884766, "max_norm/layer20": 38.50577163696289, "max_norm/layer21": 38.87571334838867, "max_norm/layer22": 39.42427062988281, "max_norm/layer23": 37.21847915649414, "max_norm/layer3": 34.34575271606445, "max_norm/layer4": 34.4432258605957, "max_norm/layer5": 44.077754974365234, "max_norm/layer6": 28.6057071685791, "max_norm/layer7": 37.91745376586914, "max_norm/layer8": 36.69032287597656, "max_norm/layer9": 37.08796691894531, "mean_norm": 11.799732064207396, "mean_norm/layer0": 11.755437850952148, "mean_norm/layer1": 11.22901839017868, "mean_norm/layer10": 11.532833635807037, "mean_norm/layer11": 11.962444841861725, "mean_norm/layer12": 12.79077160358429, "mean_norm/layer13": 11.57960969209671, "mean_norm/layer14": 12.059264957904816, "mean_norm/layer15": 12.540440499782562, "mean_norm/layer16": 11.641206741333008, "mean_norm/layer17": 12.231300234794617, "mean_norm/layer18": 11.600049555301666, "mean_norm/layer19": 11.686796128749847, "mean_norm/layer2": 9.256644666194916, "mean_norm/layer20": 11.78922188282013, "mean_norm/layer21": 11.759462356567383, "mean_norm/layer22": 13.063357532024384, "mean_norm/layer23": 13.022553265094757, "mean_norm/layer3": 12.574194192886353, "mean_norm/layer4": 10.863756775856018, "mean_norm/layer5": 14.197384178638458, "mean_norm/layer6": 10.185243308544159, "mean_norm/layer7": 10.893572747707367, "mean_norm/layer8": 11.53871750831604, "mean_norm/layer9": 11.440286993980408, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 15000 }, { "epoch": 6.26, "eval_MSE/layer0": 0.0, "eval_MSE/layer1": 0.0, "eval_MSE/layer10": 0.0, "eval_MSE/layer11": 0.0, "eval_MSE/layer12": 0.0, "eval_MSE/layer13": 0.0, "eval_MSE/layer14": 0.0, "eval_MSE/layer15": 0.0, "eval_MSE/layer16": 0.0, "eval_MSE/layer17": 0.0, "eval_MSE/layer18": 0.0, "eval_MSE/layer19": 0.0, "eval_MSE/layer2": 0.0, "eval_MSE/layer20": 0.0, "eval_MSE/layer21": 0.0, "eval_MSE/layer22": 0.0, "eval_MSE/layer23": 0.0, "eval_MSE/layer3": 0.0, "eval_MSE/layer4": 0.0, "eval_MSE/layer5": 0.0, "eval_MSE/layer6": 0.0, "eval_MSE/layer7": 0.0, "eval_MSE/layer8": 0.0, "eval_MSE/layer9": 0.0, "eval_accuracy": 0.46677861468384824, "eval_dead_code_fraction/layer0": 1.0, "eval_dead_code_fraction/layer1": 1.0, "eval_dead_code_fraction/layer10": 1.0, "eval_dead_code_fraction/layer11": 1.0, "eval_dead_code_fraction/layer12": 1.0, "eval_dead_code_fraction/layer13": 1.0, "eval_dead_code_fraction/layer14": 1.0, "eval_dead_code_fraction/layer15": 1.0, "eval_dead_code_fraction/layer16": 1.0, "eval_dead_code_fraction/layer17": 1.0, "eval_dead_code_fraction/layer18": 1.0, "eval_dead_code_fraction/layer19": 1.0, "eval_dead_code_fraction/layer2": 1.0, "eval_dead_code_fraction/layer20": 1.0, "eval_dead_code_fraction/layer21": 1.0, "eval_dead_code_fraction/layer22": 1.0, "eval_dead_code_fraction/layer23": 1.0, "eval_dead_code_fraction/layer3": 1.0, "eval_dead_code_fraction/layer4": 1.0, "eval_dead_code_fraction/layer5": 1.0, "eval_dead_code_fraction/layer6": 1.0, "eval_dead_code_fraction/layer7": 1.0, "eval_dead_code_fraction/layer8": 1.0, "eval_dead_code_fraction/layer9": 1.0, "eval_input_norm/layer0": 0.0, "eval_input_norm/layer1": 0.0, "eval_input_norm/layer10": 0.0, "eval_input_norm/layer11": 0.0, "eval_input_norm/layer12": 0.0, "eval_input_norm/layer13": 0.0, "eval_input_norm/layer14": 0.0, "eval_input_norm/layer15": 0.0, "eval_input_norm/layer16": 0.0, "eval_input_norm/layer17": 0.0, "eval_input_norm/layer18": 0.0, "eval_input_norm/layer19": 0.0, "eval_input_norm/layer2": 0.0, "eval_input_norm/layer20": 0.0, "eval_input_norm/layer21": 0.0, "eval_input_norm/layer22": 0.0, "eval_input_norm/layer23": 0.0, "eval_input_norm/layer3": 0.0, "eval_input_norm/layer4": 0.0, "eval_input_norm/layer5": 0.0, "eval_input_norm/layer6": 0.0, "eval_input_norm/layer7": 0.0, "eval_input_norm/layer8": 0.0, "eval_input_norm/layer9": 0.0, "eval_loss": 2.7446389198303223, "eval_multicode_k": 8, "eval_output_norm/layer0": 0.0, "eval_output_norm/layer1": 0.0, "eval_output_norm/layer10": 0.0, "eval_output_norm/layer11": 0.0, "eval_output_norm/layer12": 0.0, "eval_output_norm/layer13": 0.0, "eval_output_norm/layer14": 0.0, "eval_output_norm/layer15": 0.0, "eval_output_norm/layer16": 0.0, "eval_output_norm/layer17": 0.0, "eval_output_norm/layer18": 0.0, "eval_output_norm/layer19": 0.0, "eval_output_norm/layer2": 0.0, "eval_output_norm/layer20": 0.0, "eval_output_norm/layer21": 0.0, "eval_output_norm/layer22": 0.0, "eval_output_norm/layer23": 0.0, "eval_output_norm/layer3": 0.0, "eval_output_norm/layer4": 0.0, "eval_output_norm/layer5": 0.0, "eval_output_norm/layer6": 0.0, "eval_output_norm/layer7": 0.0, "eval_output_norm/layer8": 0.0, "eval_output_norm/layer9": 0.0, "eval_runtime": 11.6412, "eval_samples_per_second": 20.702, "eval_steps_per_second": 0.687, "step": 15000 }, { "MSE": 0.0, "MSE/layer0": 0.0, "MSE/layer1": 0.0, "MSE/layer10": 0.0, "MSE/layer11": 0.0, "MSE/layer12": 0.0, "MSE/layer13": 0.0, "MSE/layer14": 0.0, "MSE/layer15": 0.0, "MSE/layer16": 0.0, "MSE/layer17": 0.0, "MSE/layer18": 0.0, "MSE/layer19": 0.0, "MSE/layer2": 0.0, "MSE/layer20": 0.0, "MSE/layer21": 0.0, "MSE/layer22": 0.0, "MSE/layer23": 0.0, "MSE/layer3": 0.0, "MSE/layer4": 0.0, "MSE/layer5": 0.0, "MSE/layer6": 0.0, "MSE/layer7": 0.0, "MSE/layer8": 0.0, "MSE/layer9": 0.0, "dead_code_fraction": 1.0, "dead_code_fraction/layer0": 1.0, "dead_code_fraction/layer1": 1.0, "dead_code_fraction/layer10": 1.0, "dead_code_fraction/layer11": 1.0, "dead_code_fraction/layer12": 1.0, "dead_code_fraction/layer13": 1.0, "dead_code_fraction/layer14": 1.0, "dead_code_fraction/layer15": 1.0, "dead_code_fraction/layer16": 1.0, "dead_code_fraction/layer17": 1.0, "dead_code_fraction/layer18": 1.0, "dead_code_fraction/layer19": 1.0, "dead_code_fraction/layer2": 1.0, "dead_code_fraction/layer20": 1.0, "dead_code_fraction/layer21": 1.0, "dead_code_fraction/layer22": 1.0, "dead_code_fraction/layer23": 1.0, "dead_code_fraction/layer3": 1.0, "dead_code_fraction/layer4": 1.0, "dead_code_fraction/layer5": 1.0, "dead_code_fraction/layer6": 1.0, "dead_code_fraction/layer7": 1.0, "dead_code_fraction/layer8": 1.0, "dead_code_fraction/layer9": 1.0, "epoch": 6.26, "input_norm": 0.0, "input_norm/layer0": 0.0, "input_norm/layer1": 0.0, "input_norm/layer10": 0.0, "input_norm/layer11": 0.0, "input_norm/layer12": 0.0, "input_norm/layer13": 0.0, "input_norm/layer14": 0.0, "input_norm/layer15": 0.0, "input_norm/layer16": 0.0, "input_norm/layer17": 0.0, "input_norm/layer18": 0.0, "input_norm/layer19": 0.0, "input_norm/layer2": 0.0, "input_norm/layer20": 0.0, "input_norm/layer21": 0.0, "input_norm/layer22": 0.0, "input_norm/layer23": 0.0, "input_norm/layer3": 0.0, "input_norm/layer4": 0.0, "input_norm/layer5": 0.0, "input_norm/layer6": 0.0, "input_norm/layer7": 0.0, "input_norm/layer8": 0.0, "input_norm/layer9": 0.0, "max_norm": 45.539119720458984, "max_norm/layer0": 34.44173049926758, "max_norm/layer1": 36.61558151245117, "max_norm/layer10": 38.54380416870117, "max_norm/layer11": 34.865203857421875, "max_norm/layer12": 40.908504486083984, "max_norm/layer13": 35.78108215332031, "max_norm/layer14": 36.67228317260742, "max_norm/layer15": 45.083438873291016, "max_norm/layer16": 36.927913665771484, "max_norm/layer17": 45.539119720458984, "max_norm/layer18": 39.2352409362793, "max_norm/layer19": 38.779598236083984, "max_norm/layer2": 26.836795806884766, "max_norm/layer20": 38.50577163696289, "max_norm/layer21": 38.87571334838867, "max_norm/layer22": 39.42427062988281, "max_norm/layer23": 37.21847915649414, "max_norm/layer3": 34.34575271606445, "max_norm/layer4": 34.4432258605957, "max_norm/layer5": 44.077754974365234, "max_norm/layer6": 28.6057071685791, "max_norm/layer7": 37.91745376586914, "max_norm/layer8": 36.69032287597656, "max_norm/layer9": 37.08796691894531, "mean_norm": 11.799732064207396, "mean_norm/layer0": 11.755437850952148, "mean_norm/layer1": 11.22901839017868, "mean_norm/layer10": 11.532833635807037, "mean_norm/layer11": 11.962444841861725, "mean_norm/layer12": 12.79077160358429, "mean_norm/layer13": 11.57960969209671, "mean_norm/layer14": 12.059264957904816, "mean_norm/layer15": 12.540440499782562, "mean_norm/layer16": 11.641206741333008, "mean_norm/layer17": 12.231300234794617, "mean_norm/layer18": 11.600049555301666, "mean_norm/layer19": 11.686796128749847, "mean_norm/layer2": 9.256644666194916, "mean_norm/layer20": 11.78922188282013, "mean_norm/layer21": 11.759462356567383, "mean_norm/layer22": 13.063357532024384, "mean_norm/layer23": 13.022553265094757, "mean_norm/layer3": 12.574194192886353, "mean_norm/layer4": 10.863756775856018, "mean_norm/layer5": 14.197384178638458, "mean_norm/layer6": 10.185243308544159, "mean_norm/layer7": 10.893572747707367, "mean_norm/layer8": 11.53871750831604, "mean_norm/layer9": 11.440286993980408, "multicode_k": 8, "output_norm": 0.0, "output_norm/layer0": 0.0, "output_norm/layer1": 0.0, "output_norm/layer10": 0.0, "output_norm/layer11": 0.0, "output_norm/layer12": 0.0, "output_norm/layer13": 0.0, "output_norm/layer14": 0.0, "output_norm/layer15": 0.0, "output_norm/layer16": 0.0, "output_norm/layer17": 0.0, "output_norm/layer18": 0.0, "output_norm/layer19": 0.0, "output_norm/layer2": 0.0, "output_norm/layer20": 0.0, "output_norm/layer21": 0.0, "output_norm/layer22": 0.0, "output_norm/layer23": 0.0, "output_norm/layer3": 0.0, "output_norm/layer4": 0.0, "output_norm/layer5": 0.0, "output_norm/layer6": 0.0, "output_norm/layer7": 0.0, "output_norm/layer8": 0.0, "output_norm/layer9": 0.0, "step": 15000, "total_flos": 1.5651549796420813e+18, "train_loss": 2.685329116312663, "train_runtime": 43939.9354, "train_samples_per_second": 16.386, "train_steps_per_second": 0.341 } ], "max_steps": 15000, "num_train_epochs": 7, "total_flos": 1.5651549796420813e+18, "trial_name": null, "trial_params": null }