diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,79233 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 6.263048016701461, + "global_step": 15000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.0, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 10.4479, + "max_norm": 11.935791969299316, + "max_norm/layer0": 11.528828620910645, + "max_norm/layer1": 11.179052352905273, + "max_norm/layer10": 11.443963050842285, + "max_norm/layer11": 11.457213401794434, + "max_norm/layer12": 11.09423828125, + "max_norm/layer13": 10.991622924804688, + "max_norm/layer14": 11.824307441711426, + "max_norm/layer15": 11.151399612426758, + "max_norm/layer16": 10.765336990356445, + "max_norm/layer17": 11.6915922164917, + "max_norm/layer18": 11.321767807006836, + "max_norm/layer19": 11.388019561767578, + "max_norm/layer2": 11.24202823638916, + "max_norm/layer20": 11.28963851928711, + "max_norm/layer21": 11.935791969299316, + "max_norm/layer22": 11.426197052001953, + "max_norm/layer23": 11.311007499694824, + "max_norm/layer3": 11.2095308303833, + "max_norm/layer4": 11.231363296508789, + "max_norm/layer5": 11.49493408203125, + "max_norm/layer6": 11.883358001708984, + "max_norm/layer7": 11.410587310791016, + "max_norm/layer8": 11.1673002243042, + "max_norm/layer9": 11.320834159851074, + "mean_norm": 7.9688674112161, + "mean_norm/layer0": 7.968748152256012, + "mean_norm/layer1": 7.968711107969284, + "mean_norm/layer10": 7.96820729970932, + "mean_norm/layer11": 7.968186259269714, + "mean_norm/layer12": 7.971881151199341, + "mean_norm/layer13": 7.9677393436431885, + "mean_norm/layer14": 7.970236927270889, + "mean_norm/layer15": 7.966938257217407, + "mean_norm/layer16": 7.970880895853043, + "mean_norm/layer17": 7.967200756072998, + "mean_norm/layer18": 7.965942770242691, + "mean_norm/layer19": 7.964955180883408, + "mean_norm/layer2": 7.967412292957306, + "mean_norm/layer20": 7.969712853431702, + "mean_norm/layer21": 7.970251560211182, + "mean_norm/layer22": 7.968287110328674, + "mean_norm/layer23": 7.970414459705353, + "mean_norm/layer3": 7.969215750694275, + "mean_norm/layer4": 7.969323754310608, + "mean_norm/layer5": 7.97068253159523, + "mean_norm/layer6": 7.97090882062912, + "mean_norm/layer7": 7.968297064304352, + "mean_norm/layer8": 7.970566779375076, + "mean_norm/layer9": 7.968116790056229, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 1 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.02, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 7.6233, + "max_norm": 11.93603801727295, + "max_norm/layer0": 11.531795501708984, + "max_norm/layer1": 11.179537773132324, + "max_norm/layer10": 11.448348045349121, + "max_norm/layer11": 11.457023620605469, + "max_norm/layer12": 11.094408988952637, + "max_norm/layer13": 10.990287780761719, + "max_norm/layer14": 11.82107925415039, + "max_norm/layer15": 11.15367603302002, + "max_norm/layer16": 10.769166946411133, + "max_norm/layer17": 11.686759948730469, + "max_norm/layer18": 11.32666301727295, + "max_norm/layer19": 11.391281127929688, + "max_norm/layer2": 11.241073608398438, + "max_norm/layer20": 11.291045188903809, + "max_norm/layer21": 11.93603801727295, + "max_norm/layer22": 11.42624282836914, + "max_norm/layer23": 11.311007499694824, + "max_norm/layer3": 11.2095308303833, + "max_norm/layer4": 11.232872009277344, + "max_norm/layer5": 11.487099647521973, + "max_norm/layer6": 11.881125450134277, + "max_norm/layer7": 11.410587310791016, + "max_norm/layer8": 11.176557540893555, + "max_norm/layer9": 11.321023941040039, + "mean_norm": 7.971554110447566, + "mean_norm/layer0": 7.994439959526062, + "mean_norm/layer1": 7.975339025259018, + "mean_norm/layer10": 7.969327986240387, + "mean_norm/layer11": 7.969180196523666, + "mean_norm/layer12": 7.972845375537872, + "mean_norm/layer13": 7.968711882829666, + "mean_norm/layer14": 7.971314698457718, + "mean_norm/layer15": 7.9680851101875305, + "mean_norm/layer16": 7.971889913082123, + "mean_norm/layer17": 7.968462765216827, + "mean_norm/layer18": 7.966999590396881, + "mean_norm/layer19": 7.9660108387470245, + "mean_norm/layer2": 7.969779163599014, + "mean_norm/layer20": 7.9709367752075195, + "mean_norm/layer21": 7.971419245004654, + "mean_norm/layer22": 7.969498664140701, + "mean_norm/layer23": 7.971314489841461, + "mean_norm/layer3": 7.973078697919846, + "mean_norm/layer4": 7.971539229154587, + "mean_norm/layer5": 7.973774015903473, + "mean_norm/layer6": 7.972526788711548, + "mean_norm/layer7": 7.969632714986801, + "mean_norm/layer8": 7.971796870231628, + "mean_norm/layer9": 7.969394654035568, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 50 + }, + { + "epoch": 0.02, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.1632291324434277, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 5.859389781951904, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8439, + "eval_samples_per_second": 20.348, + "eval_steps_per_second": 0.675, + "step": 50 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.04, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 4.8681, + "max_norm": 11.938570022583008, + "max_norm/layer0": 11.561639785766602, + "max_norm/layer1": 11.204116821289062, + "max_norm/layer10": 11.462130546569824, + "max_norm/layer11": 11.474141120910645, + "max_norm/layer12": 11.094062805175781, + "max_norm/layer13": 11.00002670288086, + "max_norm/layer14": 11.826424598693848, + "max_norm/layer15": 11.166800498962402, + "max_norm/layer16": 10.781830787658691, + "max_norm/layer17": 11.687150001525879, + "max_norm/layer18": 11.340291023254395, + "max_norm/layer19": 11.40336799621582, + "max_norm/layer2": 11.241272926330566, + "max_norm/layer20": 11.293827056884766, + "max_norm/layer21": 11.938570022583008, + "max_norm/layer22": 11.450465202331543, + "max_norm/layer23": 11.329928398132324, + "max_norm/layer3": 11.215670585632324, + "max_norm/layer4": 11.24952507019043, + "max_norm/layer5": 11.489554405212402, + "max_norm/layer6": 11.858213424682617, + "max_norm/layer7": 11.412649154663086, + "max_norm/layer8": 11.180521011352539, + "max_norm/layer9": 11.323616981506348, + "mean_norm": 7.995976222058137, + "mean_norm/layer0": 8.02781367301941, + "mean_norm/layer1": 8.001955300569534, + "mean_norm/layer10": 7.991945534944534, + "mean_norm/layer11": 7.994345277547836, + "mean_norm/layer12": 7.9973015785217285, + "mean_norm/layer13": 7.990174353122711, + "mean_norm/layer14": 7.994365036487579, + "mean_norm/layer15": 7.9937964379787445, + "mean_norm/layer16": 7.993947863578796, + "mean_norm/layer17": 7.9963139295578, + "mean_norm/layer18": 7.992857217788696, + "mean_norm/layer19": 7.993478715419769, + "mean_norm/layer2": 7.984907865524292, + "mean_norm/layer20": 7.996965527534485, + "mean_norm/layer21": 7.9976761639118195, + "mean_norm/layer22": 7.997446715831757, + "mean_norm/layer23": 7.995190799236298, + "mean_norm/layer3": 8.00449624657631, + "mean_norm/layer4": 7.99257630109787, + "mean_norm/layer5": 8.008823156356812, + "mean_norm/layer6": 7.9886175096035, + "mean_norm/layer7": 7.985989451408386, + "mean_norm/layer8": 7.991247743368149, + "mean_norm/layer9": 7.991196930408478, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 100 + }, + { + "epoch": 0.04, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.3217572593827446, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 3.9806430339813232, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8323, + "eval_samples_per_second": 20.368, + "eval_steps_per_second": 0.676, + "step": 100 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.06, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.8442, + "max_norm": 11.94873046875, + "max_norm/layer0": 11.583314895629883, + "max_norm/layer1": 11.257062911987305, + "max_norm/layer10": 11.477036476135254, + "max_norm/layer11": 11.486359596252441, + "max_norm/layer12": 11.094036102294922, + "max_norm/layer13": 11.006564140319824, + "max_norm/layer14": 11.83369255065918, + "max_norm/layer15": 11.174107551574707, + "max_norm/layer16": 10.795401573181152, + "max_norm/layer17": 11.689741134643555, + "max_norm/layer18": 11.353045463562012, + "max_norm/layer19": 11.423429489135742, + "max_norm/layer2": 11.241215705871582, + "max_norm/layer20": 11.297418594360352, + "max_norm/layer21": 11.94873046875, + "max_norm/layer22": 11.467409133911133, + "max_norm/layer23": 11.351099014282227, + "max_norm/layer3": 11.237198829650879, + "max_norm/layer4": 11.2833833694458, + "max_norm/layer5": 11.501317024230957, + "max_norm/layer6": 11.842484474182129, + "max_norm/layer7": 11.412476539611816, + "max_norm/layer8": 11.197505950927734, + "max_norm/layer9": 11.32548713684082, + "mean_norm": 8.025902200490236, + "mean_norm/layer0": 8.05369970202446, + "mean_norm/layer1": 8.029805958271027, + "mean_norm/layer10": 8.019342005252838, + "mean_norm/layer11": 8.026309847831726, + "mean_norm/layer12": 8.027727752923965, + "mean_norm/layer13": 8.017128229141235, + "mean_norm/layer14": 8.023246347904205, + "mean_norm/layer15": 8.024851232767105, + "mean_norm/layer16": 8.020187258720398, + "mean_norm/layer17": 8.030142724514008, + "mean_norm/layer18": 8.022860586643219, + "mean_norm/layer19": 8.024217784404755, + "mean_norm/layer2": 8.00149068236351, + "mean_norm/layer20": 8.02658200263977, + "mean_norm/layer21": 8.028845071792603, + "mean_norm/layer22": 8.0383882522583, + "mean_norm/layer23": 8.036098837852478, + "mean_norm/layer3": 8.042394787073135, + "mean_norm/layer4": 8.019146829843521, + "mean_norm/layer5": 8.053219020366669, + "mean_norm/layer6": 8.007382929325104, + "mean_norm/layer7": 8.00985363125801, + "mean_norm/layer8": 8.019103825092316, + "mean_norm/layer9": 8.019627511501312, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 150 + }, + { + "epoch": 0.06, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.35747922269137633, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 3.630153179168701, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8097, + "eval_samples_per_second": 20.407, + "eval_steps_per_second": 0.677, + "step": 150 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.08, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.6253, + "max_norm": 11.97680950164795, + "max_norm/layer0": 11.58055591583252, + "max_norm/layer1": 11.294157028198242, + "max_norm/layer10": 11.497956275939941, + "max_norm/layer11": 11.496185302734375, + "max_norm/layer12": 11.096875190734863, + "max_norm/layer13": 11.013715744018555, + "max_norm/layer14": 11.834508895874023, + "max_norm/layer15": 11.183530807495117, + "max_norm/layer16": 10.824295043945312, + "max_norm/layer17": 11.690849304199219, + "max_norm/layer18": 11.363268852233887, + "max_norm/layer19": 11.44228744506836, + "max_norm/layer2": 11.241418838500977, + "max_norm/layer20": 11.30195140838623, + "max_norm/layer21": 11.97680950164795, + "max_norm/layer22": 11.490119934082031, + "max_norm/layer23": 11.360661506652832, + "max_norm/layer3": 11.250357627868652, + "max_norm/layer4": 11.294978141784668, + "max_norm/layer5": 11.523475646972656, + "max_norm/layer6": 11.833582878112793, + "max_norm/layer7": 11.412418365478516, + "max_norm/layer8": 11.238706588745117, + "max_norm/layer9": 11.328913688659668, + "mean_norm": 8.050771818806728, + "mean_norm/layer0": 8.074532568454742, + "mean_norm/layer1": 8.053631067276001, + "mean_norm/layer10": 8.043468981981277, + "mean_norm/layer11": 8.05247575044632, + "mean_norm/layer12": 8.05384948849678, + "mean_norm/layer13": 8.039159834384918, + "mean_norm/layer14": 8.047386288642883, + "mean_norm/layer15": 8.051487892866135, + "mean_norm/layer16": 8.041515946388245, + "mean_norm/layer17": 8.056637048721313, + "mean_norm/layer18": 8.044140785932541, + "mean_norm/layer19": 8.046563893556595, + "mean_norm/layer2": 8.015393018722534, + "mean_norm/layer20": 8.04814100265503, + "mean_norm/layer21": 8.051321744918823, + "mean_norm/layer22": 8.069881677627563, + "mean_norm/layer23": 8.0706427693367, + "mean_norm/layer3": 8.075534343719482, + "mean_norm/layer4": 8.043230772018433, + "mean_norm/layer5": 8.093363732099533, + "mean_norm/layer6": 8.024461150169373, + "mean_norm/layer7": 8.032397478818893, + "mean_norm/layer8": 8.044481456279755, + "mean_norm/layer9": 8.044824957847595, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 200 + }, + { + "epoch": 0.08, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.37222310104119766, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 3.484011650085449, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 10.8014, + "eval_samples_per_second": 22.312, + "eval_steps_per_second": 0.741, + "step": 200 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.1, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.5035, + "max_norm": 12.000293731689453, + "max_norm/layer0": 11.585112571716309, + "max_norm/layer1": 11.333687782287598, + "max_norm/layer10": 11.51988410949707, + "max_norm/layer11": 11.502758979797363, + "max_norm/layer12": 11.100769996643066, + "max_norm/layer13": 11.01984977722168, + "max_norm/layer14": 11.828566551208496, + "max_norm/layer15": 11.194990158081055, + "max_norm/layer16": 10.869253158569336, + "max_norm/layer17": 11.693120002746582, + "max_norm/layer18": 11.377907752990723, + "max_norm/layer19": 11.457249641418457, + "max_norm/layer2": 11.241273880004883, + "max_norm/layer20": 11.306483268737793, + "max_norm/layer21": 12.000293731689453, + "max_norm/layer22": 11.509583473205566, + "max_norm/layer23": 11.3687744140625, + "max_norm/layer3": 11.266392707824707, + "max_norm/layer4": 11.302397727966309, + "max_norm/layer5": 11.550718307495117, + "max_norm/layer6": 11.818743705749512, + "max_norm/layer7": 11.412418365478516, + "max_norm/layer8": 11.272293090820312, + "max_norm/layer9": 11.33436107635498, + "mean_norm": 8.074364328136047, + "mean_norm/layer0": 8.09387719631195, + "mean_norm/layer1": 8.07526409626007, + "mean_norm/layer10": 8.067595720291138, + "mean_norm/layer11": 8.078146398067474, + "mean_norm/layer12": 8.079148262739182, + "mean_norm/layer13": 8.059981882572174, + "mean_norm/layer14": 8.070948004722595, + "mean_norm/layer15": 8.077279716730118, + "mean_norm/layer16": 8.061559438705444, + "mean_norm/layer17": 8.080615043640137, + "mean_norm/layer18": 8.063488155603409, + "mean_norm/layer19": 8.066218882799149, + "mean_norm/layer2": 8.028005808591843, + "mean_norm/layer20": 8.067834615707397, + "mean_norm/layer21": 8.071941196918488, + "mean_norm/layer22": 8.098706185817719, + "mean_norm/layer23": 8.10308825969696, + "mean_norm/layer3": 8.106619775295258, + "mean_norm/layer4": 8.066012859344482, + "mean_norm/layer5": 8.132562160491943, + "mean_norm/layer6": 8.041042983531952, + "mean_norm/layer7": 8.054872512817383, + "mean_norm/layer8": 8.07003739476204, + "mean_norm/layer9": 8.069897323846817, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 250 + }, + { + "epoch": 0.1, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.38236737607638427, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 3.3861122131347656, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.55, + "eval_samples_per_second": 20.866, + "eval_steps_per_second": 0.693, + "step": 250 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.13, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.4446, + "max_norm": 12.001006126403809, + "max_norm/layer0": 11.589604377746582, + "max_norm/layer1": 11.3706693649292, + "max_norm/layer10": 11.548222541809082, + "max_norm/layer11": 11.507245063781738, + "max_norm/layer12": 11.113755226135254, + "max_norm/layer13": 11.024701118469238, + "max_norm/layer14": 11.826601028442383, + "max_norm/layer15": 11.213644027709961, + "max_norm/layer16": 10.893625259399414, + "max_norm/layer17": 11.694713592529297, + "max_norm/layer18": 11.386850357055664, + "max_norm/layer19": 11.475567817687988, + "max_norm/layer2": 11.24197769165039, + "max_norm/layer20": 11.314746856689453, + "max_norm/layer21": 12.001006126403809, + "max_norm/layer22": 11.535944938659668, + "max_norm/layer23": 11.374551773071289, + "max_norm/layer3": 11.290938377380371, + "max_norm/layer4": 11.314577102661133, + "max_norm/layer5": 11.561954498291016, + "max_norm/layer6": 11.800447463989258, + "max_norm/layer7": 11.412418365478516, + "max_norm/layer8": 11.313380241394043, + "max_norm/layer9": 11.339631080627441, + "mean_norm": 8.098208792507648, + "mean_norm/layer0": 8.112719625234604, + "mean_norm/layer1": 8.09641945362091, + "mean_norm/layer10": 8.09212476015091, + "mean_norm/layer11": 8.104212701320648, + "mean_norm/layer12": 8.105414420366287, + "mean_norm/layer13": 8.080646514892578, + "mean_norm/layer14": 8.094950437545776, + "mean_norm/layer15": 8.103815019130707, + "mean_norm/layer16": 8.082140505313873, + "mean_norm/layer17": 8.104914009571075, + "mean_norm/layer18": 8.082397997379303, + "mean_norm/layer19": 8.085450172424316, + "mean_norm/layer2": 8.041804730892181, + "mean_norm/layer20": 8.088390350341797, + "mean_norm/layer21": 8.09272289276123, + "mean_norm/layer22": 8.127672553062439, + "mean_norm/layer23": 8.135194897651672, + "mean_norm/layer3": 8.137898802757263, + "mean_norm/layer4": 8.089071333408356, + "mean_norm/layer5": 8.171739280223846, + "mean_norm/layer6": 8.057810544967651, + "mean_norm/layer7": 8.078491449356079, + "mean_norm/layer8": 8.095423579216003, + "mean_norm/layer9": 8.095584988594055, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 300 + }, + { + "epoch": 0.13, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.387530775564506, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 3.338789701461792, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8547, + "eval_samples_per_second": 20.329, + "eval_steps_per_second": 0.675, + "step": 300 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.15, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.3923, + "max_norm": 12.015610694885254, + "max_norm/layer0": 11.587407112121582, + "max_norm/layer1": 11.411787986755371, + "max_norm/layer10": 11.574077606201172, + "max_norm/layer11": 11.51120376586914, + "max_norm/layer12": 11.12320613861084, + "max_norm/layer13": 11.032407760620117, + "max_norm/layer14": 11.822674751281738, + "max_norm/layer15": 11.238204956054688, + "max_norm/layer16": 10.920355796813965, + "max_norm/layer17": 11.699063301086426, + "max_norm/layer18": 11.408402442932129, + "max_norm/layer19": 11.491950035095215, + "max_norm/layer2": 11.242212295532227, + "max_norm/layer20": 11.323861122131348, + "max_norm/layer21": 12.015610694885254, + "max_norm/layer22": 11.565690040588379, + "max_norm/layer23": 11.3798828125, + "max_norm/layer3": 11.31166934967041, + "max_norm/layer4": 11.336499214172363, + "max_norm/layer5": 11.575148582458496, + "max_norm/layer6": 11.771903038024902, + "max_norm/layer7": 11.412418365478516, + "max_norm/layer8": 11.338603973388672, + "max_norm/layer9": 11.345176696777344, + "mean_norm": 8.122111474474272, + "mean_norm/layer0": 8.130385041236877, + "mean_norm/layer1": 8.116739928722382, + "mean_norm/layer10": 8.117430806159973, + "mean_norm/layer11": 8.13034301996231, + "mean_norm/layer12": 8.132402211427689, + "mean_norm/layer13": 8.10273027420044, + "mean_norm/layer14": 8.119827210903168, + "mean_norm/layer15": 8.131300270557404, + "mean_norm/layer16": 8.103004693984985, + "mean_norm/layer17": 8.129256963729858, + "mean_norm/layer18": 8.101572036743164, + "mean_norm/layer19": 8.104348003864288, + "mean_norm/layer2": 8.053901731967926, + "mean_norm/layer20": 8.108955979347229, + "mean_norm/layer21": 8.113863289356232, + "mean_norm/layer22": 8.156916499137878, + "mean_norm/layer23": 8.166612327098846, + "mean_norm/layer3": 8.168688178062439, + "mean_norm/layer4": 8.11172890663147, + "mean_norm/layer5": 8.211617052555084, + "mean_norm/layer6": 8.074544966220856, + "mean_norm/layer7": 8.101724714040756, + "mean_norm/layer8": 8.12110459804535, + "mean_norm/layer9": 8.121676683425903, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 350 + }, + { + "epoch": 0.15, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.3928604746433685, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 3.292882204055786, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8031, + "eval_samples_per_second": 20.418, + "eval_steps_per_second": 0.678, + "step": 350 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.17, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.3488, + "max_norm": 12.052452087402344, + "max_norm/layer0": 11.583168983459473, + "max_norm/layer1": 11.448755264282227, + "max_norm/layer10": 11.607074737548828, + "max_norm/layer11": 11.51498794555664, + "max_norm/layer12": 11.131906509399414, + "max_norm/layer13": 11.042832374572754, + "max_norm/layer14": 11.821359634399414, + "max_norm/layer15": 11.259943962097168, + "max_norm/layer16": 10.950507164001465, + "max_norm/layer17": 11.704728126525879, + "max_norm/layer18": 11.416481971740723, + "max_norm/layer19": 11.509549140930176, + "max_norm/layer2": 11.243173599243164, + "max_norm/layer20": 11.331818580627441, + "max_norm/layer21": 12.052452087402344, + "max_norm/layer22": 11.601603507995605, + "max_norm/layer23": 11.385972023010254, + "max_norm/layer3": 11.330273628234863, + "max_norm/layer4": 11.340890884399414, + "max_norm/layer5": 11.589158058166504, + "max_norm/layer6": 11.758391380310059, + "max_norm/layer7": 11.412418365478516, + "max_norm/layer8": 11.364471435546875, + "max_norm/layer9": 11.363606452941895, + "mean_norm": 8.146464373916388, + "mean_norm/layer0": 8.147882997989655, + "mean_norm/layer1": 8.137409269809723, + "mean_norm/layer10": 8.143800973892212, + "mean_norm/layer11": 8.15701961517334, + "mean_norm/layer12": 8.159733355045319, + "mean_norm/layer13": 8.12478882074356, + "mean_norm/layer14": 8.144879519939423, + "mean_norm/layer15": 8.15983933210373, + "mean_norm/layer16": 8.124275922775269, + "mean_norm/layer17": 8.154035031795502, + "mean_norm/layer18": 8.12134873867035, + "mean_norm/layer19": 8.123763740062714, + "mean_norm/layer2": 8.06533831357956, + "mean_norm/layer20": 8.130630254745483, + "mean_norm/layer21": 8.135239839553833, + "mean_norm/layer22": 8.187315464019775, + "mean_norm/layer23": 8.198715567588806, + "mean_norm/layer3": 8.200076937675476, + "mean_norm/layer4": 8.13455080986023, + "mean_norm/layer5": 8.252391397953033, + "mean_norm/layer6": 8.09180998802185, + "mean_norm/layer7": 8.12533888220787, + "mean_norm/layer8": 8.147203147411346, + "mean_norm/layer9": 8.147757053375244, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 400 + }, + { + "epoch": 0.17, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.39780890148980097, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 3.262259006500244, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5766, + "eval_samples_per_second": 20.818, + "eval_steps_per_second": 0.691, + "step": 400 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.19, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.3177, + "max_norm": 12.075408935546875, + "max_norm/layer0": 11.58000373840332, + "max_norm/layer1": 11.467397689819336, + "max_norm/layer10": 11.6430082321167, + "max_norm/layer11": 11.519189834594727, + "max_norm/layer12": 11.167428016662598, + "max_norm/layer13": 11.051277160644531, + "max_norm/layer14": 11.820220947265625, + "max_norm/layer15": 11.288527488708496, + "max_norm/layer16": 10.984353065490723, + "max_norm/layer17": 11.70883846282959, + "max_norm/layer18": 11.42200756072998, + "max_norm/layer19": 11.528905868530273, + "max_norm/layer2": 11.243820190429688, + "max_norm/layer20": 11.341607093811035, + "max_norm/layer21": 12.075408935546875, + "max_norm/layer22": 11.638215065002441, + "max_norm/layer23": 11.391865730285645, + "max_norm/layer3": 11.364630699157715, + "max_norm/layer4": 11.353809356689453, + "max_norm/layer5": 11.606606483459473, + "max_norm/layer6": 11.743355751037598, + "max_norm/layer7": 11.412418365478516, + "max_norm/layer8": 11.400062561035156, + "max_norm/layer9": 11.37598991394043, + "mean_norm": 8.171071887016296, + "mean_norm/layer0": 8.165462255477905, + "mean_norm/layer1": 8.157464504241943, + "mean_norm/layer10": 8.170145452022552, + "mean_norm/layer11": 8.183974206447601, + "mean_norm/layer12": 8.187600195407867, + "mean_norm/layer13": 8.146990656852722, + "mean_norm/layer14": 8.170723497867584, + "mean_norm/layer15": 8.188680768013, + "mean_norm/layer16": 8.146208465099335, + "mean_norm/layer17": 8.179404616355896, + "mean_norm/layer18": 8.141136407852173, + "mean_norm/layer19": 8.14376151561737, + "mean_norm/layer2": 8.07688194513321, + "mean_norm/layer20": 8.152221620082855, + "mean_norm/layer21": 8.15705955028534, + "mean_norm/layer22": 8.21717494726181, + "mean_norm/layer23": 8.23116946220398, + "mean_norm/layer3": 8.231843888759613, + "mean_norm/layer4": 8.15757131576538, + "mean_norm/layer5": 8.294019222259521, + "mean_norm/layer6": 8.10983818769455, + "mean_norm/layer7": 8.148617386817932, + "mean_norm/layer8": 8.17370468378067, + "mean_norm/layer9": 8.174070537090302, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 450 + }, + { + "epoch": 0.19, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.3994718973972086, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 3.232194423675537, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8086, + "eval_samples_per_second": 20.409, + "eval_steps_per_second": 0.677, + "step": 450 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.21, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.2894, + "max_norm": 12.08602237701416, + "max_norm/layer0": 11.57630443572998, + "max_norm/layer1": 11.500665664672852, + "max_norm/layer10": 11.685675621032715, + "max_norm/layer11": 11.524746894836426, + "max_norm/layer12": 11.200533866882324, + "max_norm/layer13": 11.057424545288086, + "max_norm/layer14": 11.818695068359375, + "max_norm/layer15": 11.327396392822266, + "max_norm/layer16": 11.003171920776367, + "max_norm/layer17": 11.71567440032959, + "max_norm/layer18": 11.435552597045898, + "max_norm/layer19": 11.560956954956055, + "max_norm/layer2": 11.249007225036621, + "max_norm/layer20": 11.35300350189209, + "max_norm/layer21": 12.08602237701416, + "max_norm/layer22": 11.681539535522461, + "max_norm/layer23": 11.402434349060059, + "max_norm/layer3": 11.39268684387207, + "max_norm/layer4": 11.360640525817871, + "max_norm/layer5": 11.629146575927734, + "max_norm/layer6": 11.73115348815918, + "max_norm/layer7": 11.412418365478516, + "max_norm/layer8": 11.449997901916504, + "max_norm/layer9": 11.38539981842041, + "mean_norm": 8.196226223061482, + "mean_norm/layer0": 8.182831525802612, + "mean_norm/layer1": 8.177292108535767, + "mean_norm/layer10": 8.197421550750732, + "mean_norm/layer11": 8.212226867675781, + "mean_norm/layer12": 8.216940701007843, + "mean_norm/layer13": 8.170343518257141, + "mean_norm/layer14": 8.197417199611664, + "mean_norm/layer15": 8.218412935733795, + "mean_norm/layer16": 8.168900430202484, + "mean_norm/layer17": 8.205419719219208, + "mean_norm/layer18": 8.161637961864471, + "mean_norm/layer19": 8.164183616638184, + "mean_norm/layer2": 8.088469088077545, + "mean_norm/layer20": 8.17502224445343, + "mean_norm/layer21": 8.179168939590454, + "mean_norm/layer22": 8.248070120811462, + "mean_norm/layer23": 8.263128936290741, + "mean_norm/layer3": 8.263891696929932, + "mean_norm/layer4": 8.180212199687958, + "mean_norm/layer5": 8.336524426937103, + "mean_norm/layer6": 8.128240823745728, + "mean_norm/layer7": 8.172141283750534, + "mean_norm/layer8": 8.200634181499481, + "mean_norm/layer9": 8.20089727640152, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 500 + }, + { + "epoch": 0.21, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4021610834621141, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 3.2090389728546143, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5576, + "eval_samples_per_second": 20.852, + "eval_steps_per_second": 0.692, + "step": 500 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.23, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.2724, + "max_norm": 12.093631744384766, + "max_norm/layer0": 11.574031829833984, + "max_norm/layer1": 11.520513534545898, + "max_norm/layer10": 11.72606372833252, + "max_norm/layer11": 11.533076286315918, + "max_norm/layer12": 11.226149559020996, + "max_norm/layer13": 11.076735496520996, + "max_norm/layer14": 11.817575454711914, + "max_norm/layer15": 11.362285614013672, + "max_norm/layer16": 11.021040916442871, + "max_norm/layer17": 11.723470687866211, + "max_norm/layer18": 11.440601348876953, + "max_norm/layer19": 11.586626052856445, + "max_norm/layer2": 11.307050704956055, + "max_norm/layer20": 11.366878509521484, + "max_norm/layer21": 12.093631744384766, + "max_norm/layer22": 11.715110778808594, + "max_norm/layer23": 11.419413566589355, + "max_norm/layer3": 11.408477783203125, + "max_norm/layer4": 11.373757362365723, + "max_norm/layer5": 11.641069412231445, + "max_norm/layer6": 11.724522590637207, + "max_norm/layer7": 11.412418365478516, + "max_norm/layer8": 11.494658470153809, + "max_norm/layer9": 11.404236793518066, + "mean_norm": 8.221715872486433, + "mean_norm/layer0": 8.199663996696472, + "mean_norm/layer1": 8.197345733642578, + "mean_norm/layer10": 8.224578857421875, + "mean_norm/layer11": 8.241481006145477, + "mean_norm/layer12": 8.246900916099548, + "mean_norm/layer13": 8.194350957870483, + "mean_norm/layer14": 8.224222719669342, + "mean_norm/layer15": 8.249268531799316, + "mean_norm/layer16": 8.192130506038666, + "mean_norm/layer17": 8.23191773891449, + "mean_norm/layer18": 8.183155179023743, + "mean_norm/layer19": 8.184997946023941, + "mean_norm/layer2": 8.100345313549042, + "mean_norm/layer20": 8.198180854320526, + "mean_norm/layer21": 8.201505959033966, + "mean_norm/layer22": 8.27897161245346, + "mean_norm/layer23": 8.2966029047966, + "mean_norm/layer3": 8.295648694038391, + "mean_norm/layer4": 8.202883422374725, + "mean_norm/layer5": 8.379289329051971, + "mean_norm/layer6": 8.146961510181427, + "mean_norm/layer7": 8.195779234170914, + "mean_norm/layer8": 8.22712391614914, + "mean_norm/layer9": 8.227874100208282, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 550 + }, + { + "epoch": 0.23, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4047083064617531, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 3.19132661819458, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8083, + "eval_samples_per_second": 20.409, + "eval_steps_per_second": 0.677, + "step": 550 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.25, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.2613, + "max_norm": 12.08575439453125, + "max_norm/layer0": 11.57294750213623, + "max_norm/layer1": 11.550745010375977, + "max_norm/layer10": 11.778457641601562, + "max_norm/layer11": 11.543680191040039, + "max_norm/layer12": 11.26294231414795, + "max_norm/layer13": 11.098902702331543, + "max_norm/layer14": 11.818066596984863, + "max_norm/layer15": 11.396076202392578, + "max_norm/layer16": 11.038070678710938, + "max_norm/layer17": 11.729777336120605, + "max_norm/layer18": 11.44991683959961, + "max_norm/layer19": 11.609344482421875, + "max_norm/layer2": 11.325920104980469, + "max_norm/layer20": 11.378867149353027, + "max_norm/layer21": 12.08575439453125, + "max_norm/layer22": 11.764599800109863, + "max_norm/layer23": 11.429723739624023, + "max_norm/layer3": 11.43395709991455, + "max_norm/layer4": 11.382811546325684, + "max_norm/layer5": 11.653532028198242, + "max_norm/layer6": 11.715897560119629, + "max_norm/layer7": 11.412418365478516, + "max_norm/layer8": 11.53526782989502, + "max_norm/layer9": 11.41949462890625, + "mean_norm": 8.2477020782729, + "mean_norm/layer0": 8.216517150402069, + "mean_norm/layer1": 8.217063426971436, + "mean_norm/layer10": 8.252220571041107, + "mean_norm/layer11": 8.27081310749054, + "mean_norm/layer12": 8.277320384979248, + "mean_norm/layer13": 8.218484103679657, + "mean_norm/layer14": 8.251877188682556, + "mean_norm/layer15": 8.280709624290466, + "mean_norm/layer16": 8.215820074081421, + "mean_norm/layer17": 8.259000062942505, + "mean_norm/layer18": 8.205557763576508, + "mean_norm/layer19": 8.20718702673912, + "mean_norm/layer2": 8.11178743839264, + "mean_norm/layer20": 8.222057938575745, + "mean_norm/layer21": 8.225264191627502, + "mean_norm/layer22": 8.31117445230484, + "mean_norm/layer23": 8.33020955324173, + "mean_norm/layer3": 8.328413903713226, + "mean_norm/layer4": 8.22685432434082, + "mean_norm/layer5": 8.42192029953003, + "mean_norm/layer6": 8.165671527385712, + "mean_norm/layer7": 8.219844996929169, + "mean_norm/layer8": 8.254268229007721, + "mean_norm/layer9": 8.25481253862381, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 600 + }, + { + "epoch": 0.25, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.40806674697720074, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 3.164001226425171, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8121, + "eval_samples_per_second": 20.403, + "eval_steps_per_second": 0.677, + "step": 600 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.27, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.2317, + "max_norm": 12.080315589904785, + "max_norm/layer0": 11.57314395904541, + "max_norm/layer1": 11.564712524414062, + "max_norm/layer10": 11.826842308044434, + "max_norm/layer11": 11.56205940246582, + "max_norm/layer12": 11.327191352844238, + "max_norm/layer13": 11.14234447479248, + "max_norm/layer14": 11.822623252868652, + "max_norm/layer15": 11.452949523925781, + "max_norm/layer16": 11.063272476196289, + "max_norm/layer17": 11.735552787780762, + "max_norm/layer18": 11.489537239074707, + "max_norm/layer19": 11.642096519470215, + "max_norm/layer2": 11.34683895111084, + "max_norm/layer20": 11.390698432922363, + "max_norm/layer21": 12.080315589904785, + "max_norm/layer22": 11.80964469909668, + "max_norm/layer23": 11.444567680358887, + "max_norm/layer3": 11.46610164642334, + "max_norm/layer4": 11.389155387878418, + "max_norm/layer5": 11.663924217224121, + "max_norm/layer6": 11.711557388305664, + "max_norm/layer7": 11.412418365478516, + "max_norm/layer8": 11.58823299407959, + "max_norm/layer9": 11.441153526306152, + "mean_norm": 8.27368176728487, + "mean_norm/layer0": 8.23319536447525, + "mean_norm/layer1": 8.236526012420654, + "mean_norm/layer10": 8.279936909675598, + "mean_norm/layer11": 8.300039291381836, + "mean_norm/layer12": 8.308358132839203, + "mean_norm/layer13": 8.24279397726059, + "mean_norm/layer14": 8.280017256736755, + "mean_norm/layer15": 8.31208449602127, + "mean_norm/layer16": 8.239376664161682, + "mean_norm/layer17": 8.286569893360138, + "mean_norm/layer18": 8.228154420852661, + "mean_norm/layer19": 8.229794263839722, + "mean_norm/layer2": 8.122508347034454, + "mean_norm/layer20": 8.247145473957062, + "mean_norm/layer21": 8.249900996685028, + "mean_norm/layer22": 8.343108773231506, + "mean_norm/layer23": 8.363870322704315, + "mean_norm/layer3": 8.359816431999207, + "mean_norm/layer4": 8.249790847301483, + "mean_norm/layer5": 8.46416860818863, + "mean_norm/layer6": 8.183874189853668, + "mean_norm/layer7": 8.243731617927551, + "mean_norm/layer8": 8.281560719013214, + "mean_norm/layer9": 8.282039403915405, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 650 + }, + { + "epoch": 0.27, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.40971351853429216, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 3.150172233581543, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.798, + "eval_samples_per_second": 20.427, + "eval_steps_per_second": 0.678, + "step": 650 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.29, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.2188, + "max_norm": 12.064549446105957, + "max_norm/layer0": 11.576369285583496, + "max_norm/layer1": 11.57625961303711, + "max_norm/layer10": 11.87590217590332, + "max_norm/layer11": 11.576005935668945, + "max_norm/layer12": 11.397974014282227, + "max_norm/layer13": 11.20036506652832, + "max_norm/layer14": 11.824828147888184, + "max_norm/layer15": 11.515402793884277, + "max_norm/layer16": 11.112325668334961, + "max_norm/layer17": 11.739395141601562, + "max_norm/layer18": 11.53075885772705, + "max_norm/layer19": 11.668770790100098, + "max_norm/layer2": 11.371235847473145, + "max_norm/layer20": 11.404346466064453, + "max_norm/layer21": 12.064549446105957, + "max_norm/layer22": 11.857187271118164, + "max_norm/layer23": 11.460153579711914, + "max_norm/layer3": 11.484306335449219, + "max_norm/layer4": 11.393518447875977, + "max_norm/layer5": 11.679058074951172, + "max_norm/layer6": 11.7113618850708, + "max_norm/layer7": 11.412549018859863, + "max_norm/layer8": 11.63630485534668, + "max_norm/layer9": 11.468382835388184, + "mean_norm": 8.29998386775454, + "mean_norm/layer0": 8.249696731567383, + "mean_norm/layer1": 8.255469501018524, + "mean_norm/layer10": 8.307538092136383, + "mean_norm/layer11": 8.328807175159454, + "mean_norm/layer12": 8.340057134628296, + "mean_norm/layer13": 8.267650306224823, + "mean_norm/layer14": 8.308513700962067, + "mean_norm/layer15": 8.343885838985443, + "mean_norm/layer16": 8.263654291629791, + "mean_norm/layer17": 8.315043985843658, + "mean_norm/layer18": 8.251324594020844, + "mean_norm/layer19": 8.253050774335861, + "mean_norm/layer2": 8.132669448852539, + "mean_norm/layer20": 8.273239970207214, + "mean_norm/layer21": 8.275495648384094, + "mean_norm/layer22": 8.376473069190979, + "mean_norm/layer23": 8.397179186344147, + "mean_norm/layer3": 8.391516983509064, + "mean_norm/layer4": 8.27236133813858, + "mean_norm/layer5": 8.507023572921753, + "mean_norm/layer6": 8.20206767320633, + "mean_norm/layer7": 8.268005192279816, + "mean_norm/layer8": 8.309515058994293, + "mean_norm/layer9": 8.309373557567596, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 700 + }, + { + "epoch": 0.29, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.411676664922549, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 3.1364951133728027, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7803, + "eval_samples_per_second": 20.458, + "eval_steps_per_second": 0.679, + "step": 700 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.31, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.2161, + "max_norm": 12.05309772491455, + "max_norm/layer0": 11.57707691192627, + "max_norm/layer1": 11.590497970581055, + "max_norm/layer10": 11.933767318725586, + "max_norm/layer11": 11.590163230895996, + "max_norm/layer12": 11.48369312286377, + "max_norm/layer13": 11.255187034606934, + "max_norm/layer14": 11.825422286987305, + "max_norm/layer15": 11.571812629699707, + "max_norm/layer16": 11.15307331085205, + "max_norm/layer17": 11.7452392578125, + "max_norm/layer18": 11.56918716430664, + "max_norm/layer19": 11.707026481628418, + "max_norm/layer2": 11.40218448638916, + "max_norm/layer20": 11.431868553161621, + "max_norm/layer21": 12.05309772491455, + "max_norm/layer22": 11.90449333190918, + "max_norm/layer23": 11.471346855163574, + "max_norm/layer3": 11.509933471679688, + "max_norm/layer4": 11.459664344787598, + "max_norm/layer5": 11.687596321105957, + "max_norm/layer6": 11.70588207244873, + "max_norm/layer7": 11.449671745300293, + "max_norm/layer8": 11.691574096679688, + "max_norm/layer9": 11.537601470947266, + "mean_norm": 8.326080996543169, + "mean_norm/layer0": 8.265921652317047, + "mean_norm/layer1": 8.27424931526184, + "mean_norm/layer10": 8.334565043449402, + "mean_norm/layer11": 8.358085632324219, + "mean_norm/layer12": 8.371635675430298, + "mean_norm/layer13": 8.292467653751373, + "mean_norm/layer14": 8.336614668369293, + "mean_norm/layer15": 8.375074326992035, + "mean_norm/layer16": 8.288271248340607, + "mean_norm/layer17": 8.343531310558319, + "mean_norm/layer18": 8.274474322795868, + "mean_norm/layer19": 8.276240915060043, + "mean_norm/layer2": 8.142491519451141, + "mean_norm/layer20": 8.299282789230347, + "mean_norm/layer21": 8.301438212394714, + "mean_norm/layer22": 8.409608781337738, + "mean_norm/layer23": 8.431357860565186, + "mean_norm/layer3": 8.42233693599701, + "mean_norm/layer4": 8.29524427652359, + "mean_norm/layer5": 8.54966390132904, + "mean_norm/layer6": 8.2197967171669, + "mean_norm/layer7": 8.291634261608124, + "mean_norm/layer8": 8.336127936840057, + "mean_norm/layer9": 8.335828959941864, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 750 + }, + { + "epoch": 0.31, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.41466194538072465, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 3.1243374347686768, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7875, + "eval_samples_per_second": 20.445, + "eval_steps_per_second": 0.679, + "step": 750 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.33, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.1922, + "max_norm": 12.044909477233887, + "max_norm/layer0": 11.577107429504395, + "max_norm/layer1": 11.596969604492188, + "max_norm/layer10": 11.989384651184082, + "max_norm/layer11": 11.607263565063477, + "max_norm/layer12": 11.563121795654297, + "max_norm/layer13": 11.30004596710205, + "max_norm/layer14": 11.83565616607666, + "max_norm/layer15": 11.635966300964355, + "max_norm/layer16": 11.215364456176758, + "max_norm/layer17": 11.751420974731445, + "max_norm/layer18": 11.606756210327148, + "max_norm/layer19": 11.731042861938477, + "max_norm/layer2": 11.428869247436523, + "max_norm/layer20": 11.478826522827148, + "max_norm/layer21": 12.044909477233887, + "max_norm/layer22": 11.962320327758789, + "max_norm/layer23": 11.527593612670898, + "max_norm/layer3": 11.53365707397461, + "max_norm/layer4": 11.52773666381836, + "max_norm/layer5": 11.69833755493164, + "max_norm/layer6": 11.700189590454102, + "max_norm/layer7": 11.472933769226074, + "max_norm/layer8": 11.752439498901367, + "max_norm/layer9": 11.594074249267578, + "mean_norm": 8.351811222732067, + "mean_norm/layer0": 8.281863927841187, + "mean_norm/layer1": 8.29244977235794, + "mean_norm/layer10": 8.361223697662354, + "mean_norm/layer11": 8.386799097061157, + "mean_norm/layer12": 8.403019607067108, + "mean_norm/layer13": 8.316332519054413, + "mean_norm/layer14": 8.364771544933319, + "mean_norm/layer15": 8.405999541282654, + "mean_norm/layer16": 8.312246263027191, + "mean_norm/layer17": 8.372030258178711, + "mean_norm/layer18": 8.297933518886566, + "mean_norm/layer19": 8.299460768699646, + "mean_norm/layer2": 8.151886761188507, + "mean_norm/layer20": 8.324509799480438, + "mean_norm/layer21": 8.326754689216614, + "mean_norm/layer22": 8.443054556846619, + "mean_norm/layer23": 8.464609026908875, + "mean_norm/layer3": 8.452716946601868, + "mean_norm/layer4": 8.317551970481873, + "mean_norm/layer5": 8.592187523841858, + "mean_norm/layer6": 8.237367451190948, + "mean_norm/layer7": 8.314523756504059, + "mean_norm/layer8": 8.362704694271088, + "mean_norm/layer9": 8.36147165298462, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 800 + }, + { + "epoch": 0.33, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.41583821077864713, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 3.110368251800537, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7951, + "eval_samples_per_second": 20.432, + "eval_steps_per_second": 0.678, + "step": 800 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.35, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.1722, + "max_norm": 12.041813850402832, + "max_norm/layer0": 11.581586837768555, + "max_norm/layer1": 11.61563491821289, + "max_norm/layer10": 12.041813850402832, + "max_norm/layer11": 11.62158203125, + "max_norm/layer12": 11.668936729431152, + "max_norm/layer13": 11.349258422851562, + "max_norm/layer14": 11.871787071228027, + "max_norm/layer15": 11.716175079345703, + "max_norm/layer16": 11.261540412902832, + "max_norm/layer17": 11.757204055786133, + "max_norm/layer18": 11.649191856384277, + "max_norm/layer19": 11.76467514038086, + "max_norm/layer2": 11.455350875854492, + "max_norm/layer20": 11.54249382019043, + "max_norm/layer21": 12.034183502197266, + "max_norm/layer22": 12.032604217529297, + "max_norm/layer23": 11.640424728393555, + "max_norm/layer3": 11.551873207092285, + "max_norm/layer4": 11.593846321105957, + "max_norm/layer5": 11.747194290161133, + "max_norm/layer6": 11.696702003479004, + "max_norm/layer7": 11.496893882751465, + "max_norm/layer8": 11.801105499267578, + "max_norm/layer9": 11.650264739990234, + "mean_norm": 8.377701930701733, + "mean_norm/layer0": 8.297932505607605, + "mean_norm/layer1": 8.310682237148285, + "mean_norm/layer10": 8.388074398040771, + "mean_norm/layer11": 8.416272222995758, + "mean_norm/layer12": 8.433896124362946, + "mean_norm/layer13": 8.340609431266785, + "mean_norm/layer14": 8.393010914325714, + "mean_norm/layer15": 8.437807321548462, + "mean_norm/layer16": 8.33694452047348, + "mean_norm/layer17": 8.400605857372284, + "mean_norm/layer18": 8.321976900100708, + "mean_norm/layer19": 8.323336660861969, + "mean_norm/layer2": 8.161349713802338, + "mean_norm/layer20": 8.351431608200073, + "mean_norm/layer21": 8.352801442146301, + "mean_norm/layer22": 8.476556599140167, + "mean_norm/layer23": 8.498172104358673, + "mean_norm/layer3": 8.483105719089508, + "mean_norm/layer4": 8.33917647600174, + "mean_norm/layer5": 8.63397741317749, + "mean_norm/layer6": 8.25437742471695, + "mean_norm/layer7": 8.337139964103699, + "mean_norm/layer8": 8.388812839984894, + "mean_norm/layer9": 8.386795938014984, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 850 + }, + { + "epoch": 0.35, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.41578142555254055, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 3.0969085693359375, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8094, + "eval_samples_per_second": 20.407, + "eval_steps_per_second": 0.677, + "step": 850 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.38, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.1726, + "max_norm": 12.105155944824219, + "max_norm/layer0": 11.583524703979492, + "max_norm/layer1": 11.676701545715332, + "max_norm/layer10": 12.105155944824219, + "max_norm/layer11": 11.638466835021973, + "max_norm/layer12": 11.77223014831543, + "max_norm/layer13": 11.394583702087402, + "max_norm/layer14": 11.909969329833984, + "max_norm/layer15": 11.791295051574707, + "max_norm/layer16": 11.316922187805176, + "max_norm/layer17": 11.762696266174316, + "max_norm/layer18": 11.696808815002441, + "max_norm/layer19": 11.803051948547363, + "max_norm/layer2": 11.476975440979004, + "max_norm/layer20": 11.61272144317627, + "max_norm/layer21": 12.020544052124023, + "max_norm/layer22": 12.087778091430664, + "max_norm/layer23": 11.726238250732422, + "max_norm/layer3": 11.56999683380127, + "max_norm/layer4": 11.669652938842773, + "max_norm/layer5": 11.824197769165039, + "max_norm/layer6": 11.70715045928955, + "max_norm/layer7": 11.523516654968262, + "max_norm/layer8": 11.856184005737305, + "max_norm/layer9": 11.70484447479248, + "mean_norm": 8.403302758932114, + "mean_norm/layer0": 8.313547551631927, + "mean_norm/layer1": 8.32844340801239, + "mean_norm/layer10": 8.414072811603546, + "mean_norm/layer11": 8.445135712623596, + "mean_norm/layer12": 8.465462267398834, + "mean_norm/layer13": 8.364917397499084, + "mean_norm/layer14": 8.421625912189484, + "mean_norm/layer15": 8.468998491764069, + "mean_norm/layer16": 8.361238062381744, + "mean_norm/layer17": 8.429136097431183, + "mean_norm/layer18": 8.345595300197601, + "mean_norm/layer19": 8.347301244735718, + "mean_norm/layer2": 8.170057713985443, + "mean_norm/layer20": 8.378221929073334, + "mean_norm/layer21": 8.378659009933472, + "mean_norm/layer22": 8.510486662387848, + "mean_norm/layer23": 8.53170108795166, + "mean_norm/layer3": 8.512450098991394, + "mean_norm/layer4": 8.360101521015167, + "mean_norm/layer5": 8.675426006317139, + "mean_norm/layer6": 8.27113664150238, + "mean_norm/layer7": 8.359546661376953, + "mean_norm/layer8": 8.414047420024872, + "mean_norm/layer9": 8.411957204341888, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 900 + }, + { + "epoch": 0.38, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4186653038212401, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 3.0817902088165283, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5214, + "eval_samples_per_second": 20.918, + "eval_steps_per_second": 0.694, + "step": 900 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.4, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.1672, + "max_norm": 12.155872344970703, + "max_norm/layer0": 11.587013244628906, + "max_norm/layer1": 11.7393217086792, + "max_norm/layer10": 12.155872344970703, + "max_norm/layer11": 11.661779403686523, + "max_norm/layer12": 11.862051963806152, + "max_norm/layer13": 11.456026077270508, + "max_norm/layer14": 11.942784309387207, + "max_norm/layer15": 11.870194435119629, + "max_norm/layer16": 11.392291069030762, + "max_norm/layer17": 11.770665168762207, + "max_norm/layer18": 11.740965843200684, + "max_norm/layer19": 11.83622932434082, + "max_norm/layer2": 11.501779556274414, + "max_norm/layer20": 11.678656578063965, + "max_norm/layer21": 12.005668640136719, + "max_norm/layer22": 12.143045425415039, + "max_norm/layer23": 11.798517227172852, + "max_norm/layer3": 11.589555740356445, + "max_norm/layer4": 11.730375289916992, + "max_norm/layer5": 11.893560409545898, + "max_norm/layer6": 11.800168991088867, + "max_norm/layer7": 11.626232147216797, + "max_norm/layer8": 11.903609275817871, + "max_norm/layer9": 11.769264221191406, + "mean_norm": 8.42872379720211, + "mean_norm/layer0": 8.329014301300049, + "mean_norm/layer1": 8.345844089984894, + "mean_norm/layer10": 8.440021395683289, + "mean_norm/layer11": 8.47356379032135, + "mean_norm/layer12": 8.4962397813797, + "mean_norm/layer13": 8.388897180557251, + "mean_norm/layer14": 8.449989914894104, + "mean_norm/layer15": 8.499238908290863, + "mean_norm/layer16": 8.385041534900665, + "mean_norm/layer17": 8.458029627799988, + "mean_norm/layer18": 8.369693100452423, + "mean_norm/layer19": 8.371399164199829, + "mean_norm/layer2": 8.178799033164978, + "mean_norm/layer20": 8.405226469039917, + "mean_norm/layer21": 8.40516346693039, + "mean_norm/layer22": 8.544622302055359, + "mean_norm/layer23": 8.565294981002808, + "mean_norm/layer3": 8.541715741157532, + "mean_norm/layer4": 8.380447745323181, + "mean_norm/layer5": 8.717021226882935, + "mean_norm/layer6": 8.287675678730011, + "mean_norm/layer7": 8.38047194480896, + "mean_norm/layer8": 8.439296841621399, + "mean_norm/layer9": 8.436662912368774, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 950 + }, + { + "epoch": 0.4, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.41965904527810566, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 3.0697402954101562, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8068, + "eval_samples_per_second": 20.412, + "eval_steps_per_second": 0.678, + "step": 950 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.42, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.1499, + "max_norm": 12.205371856689453, + "max_norm/layer0": 11.665349960327148, + "max_norm/layer1": 11.794570922851562, + "max_norm/layer10": 12.205371856689453, + "max_norm/layer11": 11.683103561401367, + "max_norm/layer12": 11.96533489227295, + "max_norm/layer13": 11.50973892211914, + "max_norm/layer14": 11.985956192016602, + "max_norm/layer15": 11.945061683654785, + "max_norm/layer16": 11.481783866882324, + "max_norm/layer17": 11.784865379333496, + "max_norm/layer18": 11.786661148071289, + "max_norm/layer19": 11.881720542907715, + "max_norm/layer2": 11.518780708312988, + "max_norm/layer20": 11.752313613891602, + "max_norm/layer21": 11.9920015335083, + "max_norm/layer22": 12.204444885253906, + "max_norm/layer23": 11.857336044311523, + "max_norm/layer3": 11.719679832458496, + "max_norm/layer4": 11.798518180847168, + "max_norm/layer5": 11.96689224243164, + "max_norm/layer6": 11.870284080505371, + "max_norm/layer7": 11.738767623901367, + "max_norm/layer8": 11.964406967163086, + "max_norm/layer9": 11.882627487182617, + "mean_norm": 8.453645870089531, + "mean_norm/layer0": 8.3440882563591, + "mean_norm/layer1": 8.363113164901733, + "mean_norm/layer10": 8.465011715888977, + "mean_norm/layer11": 8.501566469669342, + "mean_norm/layer12": 8.526647329330444, + "mean_norm/layer13": 8.4126957654953, + "mean_norm/layer14": 8.477688908576965, + "mean_norm/layer15": 8.52941745519638, + "mean_norm/layer16": 8.408942818641663, + "mean_norm/layer17": 8.486901998519897, + "mean_norm/layer18": 8.393563508987427, + "mean_norm/layer19": 8.395319759845734, + "mean_norm/layer2": 8.187123000621796, + "mean_norm/layer20": 8.431950569152832, + "mean_norm/layer21": 8.430995404720306, + "mean_norm/layer22": 8.57761299610138, + "mean_norm/layer23": 8.598110377788544, + "mean_norm/layer3": 8.570252418518066, + "mean_norm/layer4": 8.400231778621674, + "mean_norm/layer5": 8.75737339258194, + "mean_norm/layer6": 8.30407863855362, + "mean_norm/layer7": 8.400870144367218, + "mean_norm/layer8": 8.463805377483368, + "mean_norm/layer9": 8.460139632225037, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 1000 + }, + { + "epoch": 0.42, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4205027114945466, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 3.066149950027466, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5243, + "eval_samples_per_second": 20.912, + "eval_steps_per_second": 0.694, + "step": 1000 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.44, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.137, + "max_norm": 12.26101303100586, + "max_norm/layer0": 11.757697105407715, + "max_norm/layer1": 11.850423812866211, + "max_norm/layer10": 12.26101303100586, + "max_norm/layer11": 11.710984230041504, + "max_norm/layer12": 12.059286117553711, + "max_norm/layer13": 11.577807426452637, + "max_norm/layer14": 12.023432731628418, + "max_norm/layer15": 12.022744178771973, + "max_norm/layer16": 11.563203811645508, + "max_norm/layer17": 11.832247734069824, + "max_norm/layer18": 11.830646514892578, + "max_norm/layer19": 11.917702674865723, + "max_norm/layer2": 11.566544532775879, + "max_norm/layer20": 11.846986770629883, + "max_norm/layer21": 11.974418640136719, + "max_norm/layer22": 12.259807586669922, + "max_norm/layer23": 11.933194160461426, + "max_norm/layer3": 11.790570259094238, + "max_norm/layer4": 11.847346305847168, + "max_norm/layer5": 12.058023452758789, + "max_norm/layer6": 11.934420585632324, + "max_norm/layer7": 11.859853744506836, + "max_norm/layer8": 12.027948379516602, + "max_norm/layer9": 12.007089614868164, + "mean_norm": 8.478731632232666, + "mean_norm/layer0": 8.359271585941315, + "mean_norm/layer1": 8.380109190940857, + "mean_norm/layer10": 8.489783465862274, + "mean_norm/layer11": 8.528929233551025, + "mean_norm/layer12": 8.557556688785553, + "mean_norm/layer13": 8.436564564704895, + "mean_norm/layer14": 8.50514006614685, + "mean_norm/layer15": 8.559872150421143, + "mean_norm/layer16": 8.43321669101715, + "mean_norm/layer17": 8.515621662139893, + "mean_norm/layer18": 8.417644321918488, + "mean_norm/layer19": 8.419948518276215, + "mean_norm/layer2": 8.196061968803406, + "mean_norm/layer20": 8.459028244018555, + "mean_norm/layer21": 8.457358598709106, + "mean_norm/layer22": 8.611605882644653, + "mean_norm/layer23": 8.631408274173737, + "mean_norm/layer3": 8.599063694477081, + "mean_norm/layer4": 8.419784009456635, + "mean_norm/layer5": 8.797651767730713, + "mean_norm/layer6": 8.320107817649841, + "mean_norm/layer7": 8.4212247133255, + "mean_norm/layer8": 8.488442122936249, + "mean_norm/layer9": 8.48416393995285, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 1050 + }, + { + "epoch": 0.44, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.42164247210425765, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 3.0529024600982666, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8004, + "eval_samples_per_second": 20.423, + "eval_steps_per_second": 0.678, + "step": 1050 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.46, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.1325, + "max_norm": 12.337430000305176, + "max_norm/layer0": 11.839350700378418, + "max_norm/layer1": 11.910687446594238, + "max_norm/layer10": 12.316972732543945, + "max_norm/layer11": 11.7444486618042, + "max_norm/layer12": 12.147137641906738, + "max_norm/layer13": 11.644682884216309, + "max_norm/layer14": 12.059837341308594, + "max_norm/layer15": 12.106205940246582, + "max_norm/layer16": 11.641736030578613, + "max_norm/layer17": 11.914681434631348, + "max_norm/layer18": 11.873185157775879, + "max_norm/layer19": 11.963512420654297, + "max_norm/layer2": 11.602706909179688, + "max_norm/layer20": 11.907248497009277, + "max_norm/layer21": 11.956596374511719, + "max_norm/layer22": 12.337430000305176, + "max_norm/layer23": 12.008430480957031, + "max_norm/layer3": 11.857219696044922, + "max_norm/layer4": 11.907477378845215, + "max_norm/layer5": 12.181724548339844, + "max_norm/layer6": 12.007532119750977, + "max_norm/layer7": 12.028894424438477, + "max_norm/layer8": 12.075993537902832, + "max_norm/layer9": 12.120156288146973, + "mean_norm": 8.503541881839434, + "mean_norm/layer0": 8.374323666095734, + "mean_norm/layer1": 8.396947979927063, + "mean_norm/layer10": 8.514197707176208, + "mean_norm/layer11": 8.556173324584961, + "mean_norm/layer12": 8.588340997695923, + "mean_norm/layer13": 8.459864497184753, + "mean_norm/layer14": 8.53289008140564, + "mean_norm/layer15": 8.589832186698914, + "mean_norm/layer16": 8.457439363002777, + "mean_norm/layer17": 8.544645309448242, + "mean_norm/layer18": 8.441946268081665, + "mean_norm/layer19": 8.444604992866516, + "mean_norm/layer2": 8.204352736473083, + "mean_norm/layer20": 8.486289203166962, + "mean_norm/layer21": 8.483921110630035, + "mean_norm/layer22": 8.645121037960052, + "mean_norm/layer23": 8.664347052574158, + "mean_norm/layer3": 8.627211809158325, + "mean_norm/layer4": 8.439228117465973, + "mean_norm/layer5": 8.836770415306091, + "mean_norm/layer6": 8.33525162935257, + "mean_norm/layer7": 8.441284954547882, + "mean_norm/layer8": 8.512612342834473, + "mean_norm/layer9": 8.507408380508423, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 1100 + }, + { + "epoch": 0.46, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.422713279225125, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 3.053382396697998, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8038, + "eval_samples_per_second": 20.417, + "eval_steps_per_second": 0.678, + "step": 1100 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.48, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.1134, + "max_norm": 12.390501022338867, + "max_norm/layer0": 11.916831016540527, + "max_norm/layer1": 11.991969108581543, + "max_norm/layer10": 12.356989860534668, + "max_norm/layer11": 11.778839111328125, + "max_norm/layer12": 12.239680290222168, + "max_norm/layer13": 11.736593246459961, + "max_norm/layer14": 12.143863677978516, + "max_norm/layer15": 12.180139541625977, + "max_norm/layer16": 11.728737831115723, + "max_norm/layer17": 12.01159381866455, + "max_norm/layer18": 11.933110237121582, + "max_norm/layer19": 12.001410484313965, + "max_norm/layer2": 11.658327102661133, + "max_norm/layer20": 11.978069305419922, + "max_norm/layer21": 11.949234008789062, + "max_norm/layer22": 12.390501022338867, + "max_norm/layer23": 12.06468677520752, + "max_norm/layer3": 11.926894187927246, + "max_norm/layer4": 11.99174976348877, + "max_norm/layer5": 12.265400886535645, + "max_norm/layer6": 12.064791679382324, + "max_norm/layer7": 12.149833679199219, + "max_norm/layer8": 12.13364028930664, + "max_norm/layer9": 12.21767807006836, + "mean_norm": 8.52769010514021, + "mean_norm/layer0": 8.388884007930756, + "mean_norm/layer1": 8.41365897655487, + "mean_norm/layer10": 8.53753811120987, + "mean_norm/layer11": 8.58243614435196, + "mean_norm/layer12": 8.618303418159485, + "mean_norm/layer13": 8.482500731945038, + "mean_norm/layer14": 8.5594362616539, + "mean_norm/layer15": 8.619120597839355, + "mean_norm/layer16": 8.481026113033295, + "mean_norm/layer17": 8.573175191879272, + "mean_norm/layer18": 8.466035664081573, + "mean_norm/layer19": 8.468759298324585, + "mean_norm/layer2": 8.21207869052887, + "mean_norm/layer20": 8.513489484786987, + "mean_norm/layer21": 8.50997406244278, + "mean_norm/layer22": 8.67935174703598, + "mean_norm/layer23": 8.69653707742691, + "mean_norm/layer3": 8.654048144817352, + "mean_norm/layer4": 8.45800656080246, + "mean_norm/layer5": 8.874925374984741, + "mean_norm/layer6": 8.349959671497345, + "mean_norm/layer7": 8.460034430027008, + "mean_norm/layer8": 8.535409569740295, + "mean_norm/layer9": 8.529873192310333, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 1150 + }, + { + "epoch": 0.48, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.42448984558474584, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 3.033704996109009, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5345, + "eval_samples_per_second": 20.894, + "eval_steps_per_second": 0.694, + "step": 1150 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.5, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.0942, + "max_norm": 12.468120574951172, + "max_norm/layer0": 11.995326042175293, + "max_norm/layer1": 12.067697525024414, + "max_norm/layer10": 12.403990745544434, + "max_norm/layer11": 11.817073822021484, + "max_norm/layer12": 12.339508056640625, + "max_norm/layer13": 11.813336372375488, + "max_norm/layer14": 12.205154418945312, + "max_norm/layer15": 12.247501373291016, + "max_norm/layer16": 11.802889823913574, + "max_norm/layer17": 12.11780834197998, + "max_norm/layer18": 11.991769790649414, + "max_norm/layer19": 12.04055404663086, + "max_norm/layer2": 11.691339492797852, + "max_norm/layer20": 12.061504364013672, + "max_norm/layer21": 11.942378997802734, + "max_norm/layer22": 12.468120574951172, + "max_norm/layer23": 12.125564575195312, + "max_norm/layer3": 12.011069297790527, + "max_norm/layer4": 12.092073440551758, + "max_norm/layer5": 12.332050323486328, + "max_norm/layer6": 12.111506462097168, + "max_norm/layer7": 12.237801551818848, + "max_norm/layer8": 12.18825626373291, + "max_norm/layer9": 12.341841697692871, + "mean_norm": 8.55142513414224, + "mean_norm/layer0": 8.403229653835297, + "mean_norm/layer1": 8.430038452148438, + "mean_norm/layer10": 8.560727715492249, + "mean_norm/layer11": 8.608600378036499, + "mean_norm/layer12": 8.647474765777588, + "mean_norm/layer13": 8.504248023033142, + "mean_norm/layer14": 8.58581668138504, + "mean_norm/layer15": 8.647967278957367, + "mean_norm/layer16": 8.503765046596527, + "mean_norm/layer17": 8.601675927639008, + "mean_norm/layer18": 8.490412592887878, + "mean_norm/layer19": 8.492941200733185, + "mean_norm/layer2": 8.219275295734406, + "mean_norm/layer20": 8.539772391319275, + "mean_norm/layer21": 8.53559297323227, + "mean_norm/layer22": 8.712083876132965, + "mean_norm/layer23": 8.729129493236542, + "mean_norm/layer3": 8.680878758430481, + "mean_norm/layer4": 8.476042687892914, + "mean_norm/layer5": 8.91216629743576, + "mean_norm/layer6": 8.364468932151794, + "mean_norm/layer7": 8.478329598903656, + "mean_norm/layer8": 8.557778775691986, + "mean_norm/layer9": 8.551786422729492, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 1200 + }, + { + "epoch": 0.5, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.425163156122867, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 3.0296287536621094, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7916, + "eval_samples_per_second": 20.438, + "eval_steps_per_second": 0.678, + "step": 1200 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.52, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.1078, + "max_norm": 12.530866622924805, + "max_norm/layer0": 12.061227798461914, + "max_norm/layer1": 12.141142845153809, + "max_norm/layer10": 12.451057434082031, + "max_norm/layer11": 11.885611534118652, + "max_norm/layer12": 12.420894622802734, + "max_norm/layer13": 11.879868507385254, + "max_norm/layer14": 12.285859107971191, + "max_norm/layer15": 12.319154739379883, + "max_norm/layer16": 11.870779037475586, + "max_norm/layer17": 12.209052085876465, + "max_norm/layer18": 12.042786598205566, + "max_norm/layer19": 12.080160140991211, + "max_norm/layer2": 11.76501178741455, + "max_norm/layer20": 12.142309188842773, + "max_norm/layer21": 12.006357192993164, + "max_norm/layer22": 12.530866622924805, + "max_norm/layer23": 12.205020904541016, + "max_norm/layer3": 12.123080253601074, + "max_norm/layer4": 12.156495094299316, + "max_norm/layer5": 12.430468559265137, + "max_norm/layer6": 12.177638053894043, + "max_norm/layer7": 12.356688499450684, + "max_norm/layer8": 12.309911727905273, + "max_norm/layer9": 12.442432403564453, + "mean_norm": 8.574853877226511, + "mean_norm/layer0": 8.417532444000244, + "mean_norm/layer1": 8.446242809295654, + "mean_norm/layer10": 8.583423614501953, + "mean_norm/layer11": 8.634363651275635, + "mean_norm/layer12": 8.676055133342743, + "mean_norm/layer13": 8.525701999664307, + "mean_norm/layer14": 8.611644744873047, + "mean_norm/layer15": 8.676322281360626, + "mean_norm/layer16": 8.526974976062775, + "mean_norm/layer17": 8.629515528678894, + "mean_norm/layer18": 8.514853537082672, + "mean_norm/layer19": 8.516682028770447, + "mean_norm/layer2": 8.226419508457184, + "mean_norm/layer20": 8.565673828125, + "mean_norm/layer21": 8.56021511554718, + "mean_norm/layer22": 8.744957864284515, + "mean_norm/layer23": 8.761150598526001, + "mean_norm/layer3": 8.706950187683105, + "mean_norm/layer4": 8.49384981393814, + "mean_norm/layer5": 8.949612021446228, + "mean_norm/layer6": 8.378373205661774, + "mean_norm/layer7": 8.496361255645752, + "mean_norm/layer8": 8.580375611782074, + "mean_norm/layer9": 8.573241293430328, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 1250 + }, + { + "epoch": 0.52, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4257472327342492, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 3.0218803882598877, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7879, + "eval_samples_per_second": 20.445, + "eval_steps_per_second": 0.679, + "step": 1250 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.54, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.086, + "max_norm": 12.616530418395996, + "max_norm/layer0": 12.120105743408203, + "max_norm/layer1": 12.24160385131836, + "max_norm/layer10": 12.489425659179688, + "max_norm/layer11": 11.951299667358398, + "max_norm/layer12": 12.510804176330566, + "max_norm/layer13": 11.954564094543457, + "max_norm/layer14": 12.374727249145508, + "max_norm/layer15": 12.41003131866455, + "max_norm/layer16": 11.95055866241455, + "max_norm/layer17": 12.313188552856445, + "max_norm/layer18": 12.117609977722168, + "max_norm/layer19": 12.119937896728516, + "max_norm/layer2": 11.798491477966309, + "max_norm/layer20": 12.230223655700684, + "max_norm/layer21": 12.09094524383545, + "max_norm/layer22": 12.616530418395996, + "max_norm/layer23": 12.287936210632324, + "max_norm/layer3": 12.218461990356445, + "max_norm/layer4": 12.223498344421387, + "max_norm/layer5": 12.541898727416992, + "max_norm/layer6": 12.239702224731445, + "max_norm/layer7": 12.441795349121094, + "max_norm/layer8": 12.388147354125977, + "max_norm/layer9": 12.528850555419922, + "mean_norm": 8.597911283373833, + "mean_norm/layer0": 8.4317027926445, + "mean_norm/layer1": 8.461981654167175, + "mean_norm/layer10": 8.605356931686401, + "mean_norm/layer11": 8.659491837024689, + "mean_norm/layer12": 8.704477965831757, + "mean_norm/layer13": 8.547408878803253, + "mean_norm/layer14": 8.637555420398712, + "mean_norm/layer15": 8.704207181930542, + "mean_norm/layer16": 8.54949301481247, + "mean_norm/layer17": 8.657357454299927, + "mean_norm/layer18": 8.539100170135498, + "mean_norm/layer19": 8.540253460407257, + "mean_norm/layer2": 8.23346322774887, + "mean_norm/layer20": 8.592048525810242, + "mean_norm/layer21": 8.585165977478027, + "mean_norm/layer22": 8.777146875858307, + "mean_norm/layer23": 8.792299032211304, + "mean_norm/layer3": 8.732121765613556, + "mean_norm/layer4": 8.511165499687195, + "mean_norm/layer5": 8.986108601093292, + "mean_norm/layer6": 8.391669809818268, + "mean_norm/layer7": 8.513608872890472, + "mean_norm/layer8": 8.602046430110931, + "mean_norm/layer9": 8.594639420509338, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 1300 + }, + { + "epoch": 0.54, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.42775093999829644, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 3.009110927581787, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8152, + "eval_samples_per_second": 20.397, + "eval_steps_per_second": 0.677, + "step": 1300 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.56, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.0909, + "max_norm": 12.686294555664062, + "max_norm/layer0": 12.181984901428223, + "max_norm/layer1": 12.317867279052734, + "max_norm/layer10": 12.543929100036621, + "max_norm/layer11": 12.017821311950684, + "max_norm/layer12": 12.592409133911133, + "max_norm/layer13": 12.018542289733887, + "max_norm/layer14": 12.431426048278809, + "max_norm/layer15": 12.49692153930664, + "max_norm/layer16": 12.016731262207031, + "max_norm/layer17": 12.427252769470215, + "max_norm/layer18": 12.205350875854492, + "max_norm/layer19": 12.160531044006348, + "max_norm/layer2": 11.837761878967285, + "max_norm/layer20": 12.30910587310791, + "max_norm/layer21": 12.182352066040039, + "max_norm/layer22": 12.686294555664062, + "max_norm/layer23": 12.399474143981934, + "max_norm/layer3": 12.289910316467285, + "max_norm/layer4": 12.31454849243164, + "max_norm/layer5": 12.639134407043457, + "max_norm/layer6": 12.315422058105469, + "max_norm/layer7": 12.572528839111328, + "max_norm/layer8": 12.499512672424316, + "max_norm/layer9": 12.626362800598145, + "mean_norm": 8.62041107316812, + "mean_norm/layer0": 8.445489645004272, + "mean_norm/layer1": 8.477490961551666, + "mean_norm/layer10": 8.626979351043701, + "mean_norm/layer11": 8.683675706386566, + "mean_norm/layer12": 8.732514381408691, + "mean_norm/layer13": 8.567951917648315, + "mean_norm/layer14": 8.662712216377258, + "mean_norm/layer15": 8.731165051460266, + "mean_norm/layer16": 8.571608543395996, + "mean_norm/layer17": 8.684390306472778, + "mean_norm/layer18": 8.562283277511597, + "mean_norm/layer19": 8.563570141792297, + "mean_norm/layer2": 8.239861786365509, + "mean_norm/layer20": 8.617091238498688, + "mean_norm/layer21": 8.609572529792786, + "mean_norm/layer22": 8.809150457382202, + "mean_norm/layer23": 8.823075652122498, + "mean_norm/layer3": 8.756663084030151, + "mean_norm/layer4": 8.528301894664764, + "mean_norm/layer5": 9.021451652050018, + "mean_norm/layer6": 8.404954314231873, + "mean_norm/layer7": 8.530861616134644, + "mean_norm/layer8": 8.623531699180603, + "mean_norm/layer9": 8.61551833152771, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 1350 + }, + { + "epoch": 0.56, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4288744762576914, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 3.00097393989563, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8281, + "eval_samples_per_second": 20.375, + "eval_steps_per_second": 0.676, + "step": 1350 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.58, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.0855, + "max_norm": 12.768488883972168, + "max_norm/layer0": 12.241242408752441, + "max_norm/layer1": 12.424370765686035, + "max_norm/layer10": 12.65182113647461, + "max_norm/layer11": 12.119407653808594, + "max_norm/layer12": 12.677779197692871, + "max_norm/layer13": 12.085238456726074, + "max_norm/layer14": 12.553781509399414, + "max_norm/layer15": 12.58381175994873, + "max_norm/layer16": 12.0853853225708, + "max_norm/layer17": 12.551607131958008, + "max_norm/layer18": 12.261463165283203, + "max_norm/layer19": 12.205509185791016, + "max_norm/layer2": 11.860236167907715, + "max_norm/layer20": 12.388531684875488, + "max_norm/layer21": 12.284324645996094, + "max_norm/layer22": 12.768488883972168, + "max_norm/layer23": 12.490804672241211, + "max_norm/layer3": 12.376986503601074, + "max_norm/layer4": 12.416421890258789, + "max_norm/layer5": 12.763866424560547, + "max_norm/layer6": 12.37830638885498, + "max_norm/layer7": 12.686251640319824, + "max_norm/layer8": 12.616026878356934, + "max_norm/layer9": 12.709514617919922, + "mean_norm": 8.642726625005404, + "mean_norm/layer0": 8.45906376838684, + "mean_norm/layer1": 8.49306035041809, + "mean_norm/layer10": 8.64819061756134, + "mean_norm/layer11": 8.707186877727509, + "mean_norm/layer12": 8.760173201560974, + "mean_norm/layer13": 8.58885395526886, + "mean_norm/layer14": 8.687394678592682, + "mean_norm/layer15": 8.758006572723389, + "mean_norm/layer16": 8.593712091445923, + "mean_norm/layer17": 8.711206674575806, + "mean_norm/layer18": 8.585395872592926, + "mean_norm/layer19": 8.587033748626709, + "mean_norm/layer2": 8.246377110481262, + "mean_norm/layer20": 8.6430304646492, + "mean_norm/layer21": 8.633982956409454, + "mean_norm/layer22": 8.84108155965805, + "mean_norm/layer23": 8.853368699550629, + "mean_norm/layer3": 8.7816281914711, + "mean_norm/layer4": 8.544718623161316, + "mean_norm/layer5": 9.056117296218872, + "mean_norm/layer6": 8.417579352855682, + "mean_norm/layer7": 8.547739028930664, + "mean_norm/layer8": 8.644529163837433, + "mean_norm/layer9": 8.636008143424988, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 1400 + }, + { + "epoch": 0.58, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.428842027557059, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.993396043777466, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5577, + "eval_samples_per_second": 20.852, + "eval_steps_per_second": 0.692, + "step": 1400 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.61, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.065, + "max_norm": 12.911163330078125, + "max_norm/layer0": 12.293036460876465, + "max_norm/layer1": 12.547085762023926, + "max_norm/layer10": 12.76215648651123, + "max_norm/layer11": 12.25842571258545, + "max_norm/layer12": 12.75853443145752, + "max_norm/layer13": 12.15564250946045, + "max_norm/layer14": 12.656801223754883, + "max_norm/layer15": 12.706408500671387, + "max_norm/layer16": 12.161219596862793, + "max_norm/layer17": 12.7056245803833, + "max_norm/layer18": 12.327484130859375, + "max_norm/layer19": 12.249855995178223, + "max_norm/layer2": 11.891606330871582, + "max_norm/layer20": 12.475489616394043, + "max_norm/layer21": 12.39600944519043, + "max_norm/layer22": 12.857209205627441, + "max_norm/layer23": 12.605290412902832, + "max_norm/layer3": 12.465520858764648, + "max_norm/layer4": 12.489715576171875, + "max_norm/layer5": 12.911163330078125, + "max_norm/layer6": 12.437993049621582, + "max_norm/layer7": 12.785067558288574, + "max_norm/layer8": 12.7163667678833, + "max_norm/layer9": 12.821453094482422, + "mean_norm": 8.664971977472305, + "mean_norm/layer0": 8.472568154335022, + "mean_norm/layer1": 8.508402287960052, + "mean_norm/layer10": 8.669077575206757, + "mean_norm/layer11": 8.730392575263977, + "mean_norm/layer12": 8.787680089473724, + "mean_norm/layer13": 8.609262645244598, + "mean_norm/layer14": 8.711707293987274, + "mean_norm/layer15": 8.78460282087326, + "mean_norm/layer16": 8.616038620471954, + "mean_norm/layer17": 8.738197267055511, + "mean_norm/layer18": 8.608790636062622, + "mean_norm/layer19": 8.610539197921753, + "mean_norm/layer2": 8.253041744232178, + "mean_norm/layer20": 8.669034600257874, + "mean_norm/layer21": 8.65846562385559, + "mean_norm/layer22": 8.872988402843475, + "mean_norm/layer23": 8.883999526500702, + "mean_norm/layer3": 8.80587100982666, + "mean_norm/layer4": 8.561438500881195, + "mean_norm/layer5": 9.091051876544952, + "mean_norm/layer6": 8.430066585540771, + "mean_norm/layer7": 8.564611732959747, + "mean_norm/layer8": 8.66524201631546, + "mean_norm/layer9": 8.656256675720215, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 1450 + }, + { + "epoch": 0.61, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4306429304421541, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.986873149871826, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5366, + "eval_samples_per_second": 20.89, + "eval_steps_per_second": 0.693, + "step": 1450 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.63, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.0722, + "max_norm": 13.059762001037598, + "max_norm/layer0": 12.345417022705078, + "max_norm/layer1": 12.659737586975098, + "max_norm/layer10": 12.856481552124023, + "max_norm/layer11": 12.383923530578613, + "max_norm/layer12": 12.854155540466309, + "max_norm/layer13": 12.24963665008545, + "max_norm/layer14": 12.79176139831543, + "max_norm/layer15": 12.82961368560791, + "max_norm/layer16": 12.242087364196777, + "max_norm/layer17": 12.827202796936035, + "max_norm/layer18": 12.374549865722656, + "max_norm/layer19": 12.30087661743164, + "max_norm/layer2": 11.919795989990234, + "max_norm/layer20": 12.611680030822754, + "max_norm/layer21": 12.485276222229004, + "max_norm/layer22": 12.907124519348145, + "max_norm/layer23": 12.714141845703125, + "max_norm/layer3": 12.535303115844727, + "max_norm/layer4": 12.54542064666748, + "max_norm/layer5": 13.059762001037598, + "max_norm/layer6": 12.518970489501953, + "max_norm/layer7": 12.897445678710938, + "max_norm/layer8": 12.807401657104492, + "max_norm/layer9": 12.903473854064941, + "mean_norm": 8.68662746498982, + "mean_norm/layer0": 8.48574846982956, + "mean_norm/layer1": 8.523551344871521, + "mean_norm/layer10": 8.689225196838379, + "mean_norm/layer11": 8.753485918045044, + "mean_norm/layer12": 8.814705193042755, + "mean_norm/layer13": 8.629233002662659, + "mean_norm/layer14": 8.735382556915283, + "mean_norm/layer15": 8.810544908046722, + "mean_norm/layer16": 8.637446343898773, + "mean_norm/layer17": 8.764160871505737, + "mean_norm/layer18": 8.63146036863327, + "mean_norm/layer19": 8.63357812166214, + "mean_norm/layer2": 8.259207248687744, + "mean_norm/layer20": 8.694165408611298, + "mean_norm/layer21": 8.681831121444702, + "mean_norm/layer22": 8.90420150756836, + "mean_norm/layer23": 8.914546489715576, + "mean_norm/layer3": 8.829843997955322, + "mean_norm/layer4": 8.577266812324524, + "mean_norm/layer5": 9.12503045797348, + "mean_norm/layer6": 8.442515015602112, + "mean_norm/layer7": 8.580586612224579, + "mean_norm/layer8": 8.685438334941864, + "mean_norm/layer9": 8.675903856754303, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 1500 + }, + { + "epoch": 0.63, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4305942573912056, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.9838168621063232, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5335, + "eval_samples_per_second": 20.896, + "eval_steps_per_second": 0.694, + "step": 1500 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.65, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.0536, + "max_norm": 13.204683303833008, + "max_norm/layer0": 12.397311210632324, + "max_norm/layer1": 12.771734237670898, + "max_norm/layer10": 12.999382019042969, + "max_norm/layer11": 12.556604385375977, + "max_norm/layer12": 12.944580078125, + "max_norm/layer13": 12.302048683166504, + "max_norm/layer14": 12.901226043701172, + "max_norm/layer15": 12.932552337646484, + "max_norm/layer16": 12.336416244506836, + "max_norm/layer17": 12.978598594665527, + "max_norm/layer18": 12.42466926574707, + "max_norm/layer19": 12.365293502807617, + "max_norm/layer2": 11.952788352966309, + "max_norm/layer20": 12.757342338562012, + "max_norm/layer21": 12.583632469177246, + "max_norm/layer22": 12.97545051574707, + "max_norm/layer23": 12.805314064025879, + "max_norm/layer3": 12.61535358428955, + "max_norm/layer4": 12.621912956237793, + "max_norm/layer5": 13.204683303833008, + "max_norm/layer6": 12.58818531036377, + "max_norm/layer7": 12.9867525100708, + "max_norm/layer8": 12.903141021728516, + "max_norm/layer9": 13.003826141357422, + "mean_norm": 8.707863385478655, + "mean_norm/layer0": 8.498963057994843, + "mean_norm/layer1": 8.538367092609406, + "mean_norm/layer10": 8.70906138420105, + "mean_norm/layer11": 8.776423811912537, + "mean_norm/layer12": 8.841421246528625, + "mean_norm/layer13": 8.649191439151764, + "mean_norm/layer14": 8.758762776851654, + "mean_norm/layer15": 8.83595359325409, + "mean_norm/layer16": 8.658472955226898, + "mean_norm/layer17": 8.789756417274475, + "mean_norm/layer18": 8.654428124427795, + "mean_norm/layer19": 8.656601250171661, + "mean_norm/layer2": 8.265197396278381, + "mean_norm/layer20": 8.719094395637512, + "mean_norm/layer21": 8.704816818237305, + "mean_norm/layer22": 8.934785842895508, + "mean_norm/layer23": 8.943950235843658, + "mean_norm/layer3": 8.853420853614807, + "mean_norm/layer4": 8.591943502426147, + "mean_norm/layer5": 9.157538950443268, + "mean_norm/layer6": 8.45427131652832, + "mean_norm/layer7": 8.59613686800003, + "mean_norm/layer8": 8.705270826816559, + "mean_norm/layer9": 8.694891095161438, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 1550 + }, + { + "epoch": 0.65, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.43009130253140426, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.982506036758423, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7956, + "eval_samples_per_second": 20.431, + "eval_steps_per_second": 0.678, + "step": 1550 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.67, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.0505, + "max_norm": 13.3615140914917, + "max_norm/layer0": 12.517741203308105, + "max_norm/layer1": 12.865513801574707, + "max_norm/layer10": 13.127941131591797, + "max_norm/layer11": 12.687420845031738, + "max_norm/layer12": 13.030386924743652, + "max_norm/layer13": 12.377881050109863, + "max_norm/layer14": 13.030510902404785, + "max_norm/layer15": 13.021608352661133, + "max_norm/layer16": 12.415884971618652, + "max_norm/layer17": 13.139957427978516, + "max_norm/layer18": 12.48414134979248, + "max_norm/layer19": 12.458990097045898, + "max_norm/layer2": 11.990442276000977, + "max_norm/layer20": 12.859320640563965, + "max_norm/layer21": 12.669166564941406, + "max_norm/layer22": 13.055481910705566, + "max_norm/layer23": 12.907835006713867, + "max_norm/layer3": 12.686458587646484, + "max_norm/layer4": 12.707650184631348, + "max_norm/layer5": 13.3615140914917, + "max_norm/layer6": 12.65063190460205, + "max_norm/layer7": 13.089656829833984, + "max_norm/layer8": 13.009183883666992, + "max_norm/layer9": 13.109399795532227, + "mean_norm": 8.728878619770208, + "mean_norm/layer0": 8.511847734451294, + "mean_norm/layer1": 8.553039729595184, + "mean_norm/layer10": 8.729139029979706, + "mean_norm/layer11": 8.798815786838531, + "mean_norm/layer12": 8.867528319358826, + "mean_norm/layer13": 8.668808817863464, + "mean_norm/layer14": 8.782176852226257, + "mean_norm/layer15": 8.861507177352905, + "mean_norm/layer16": 8.679296255111694, + "mean_norm/layer17": 8.815626800060272, + "mean_norm/layer18": 8.677160620689392, + "mean_norm/layer19": 8.679296314716339, + "mean_norm/layer2": 8.271026909351349, + "mean_norm/layer20": 8.743983507156372, + "mean_norm/layer21": 8.727519035339355, + "mean_norm/layer22": 8.9653200507164, + "mean_norm/layer23": 8.97294557094574, + "mean_norm/layer3": 8.87597405910492, + "mean_norm/layer4": 8.607149243354797, + "mean_norm/layer5": 9.19001019001007, + "mean_norm/layer6": 8.466087341308594, + "mean_norm/layer7": 8.611168026924133, + "mean_norm/layer8": 8.724406242370605, + "mean_norm/layer9": 8.713253259658813, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 1600 + }, + { + "epoch": 0.67, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4306591547924703, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.9796295166015625, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8191, + "eval_samples_per_second": 20.391, + "eval_steps_per_second": 0.677, + "step": 1600 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.69, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.0475, + "max_norm": 13.540763854980469, + "max_norm/layer0": 12.632498741149902, + "max_norm/layer1": 12.943493843078613, + "max_norm/layer10": 13.258481979370117, + "max_norm/layer11": 12.811452865600586, + "max_norm/layer12": 13.11585807800293, + "max_norm/layer13": 12.44717025756836, + "max_norm/layer14": 13.164324760437012, + "max_norm/layer15": 13.170096397399902, + "max_norm/layer16": 12.488635063171387, + "max_norm/layer17": 13.308391571044922, + "max_norm/layer18": 12.548270225524902, + "max_norm/layer19": 12.54361629486084, + "max_norm/layer2": 12.023127555847168, + "max_norm/layer20": 12.954742431640625, + "max_norm/layer21": 12.747000694274902, + "max_norm/layer22": 13.133721351623535, + "max_norm/layer23": 13.020496368408203, + "max_norm/layer3": 12.763312339782715, + "max_norm/layer4": 12.796082496643066, + "max_norm/layer5": 13.540763854980469, + "max_norm/layer6": 12.707022666931152, + "max_norm/layer7": 13.211490631103516, + "max_norm/layer8": 13.115765571594238, + "max_norm/layer9": 13.189752578735352, + "mean_norm": 8.749427725871405, + "mean_norm/layer0": 8.52438485622406, + "mean_norm/layer1": 8.567584753036499, + "mean_norm/layer10": 8.74834829568863, + "mean_norm/layer11": 8.820571064949036, + "mean_norm/layer12": 8.892871975898743, + "mean_norm/layer13": 8.687913954257965, + "mean_norm/layer14": 8.805040657520294, + "mean_norm/layer15": 8.88647973537445, + "mean_norm/layer16": 8.699283361434937, + "mean_norm/layer17": 8.841068029403687, + "mean_norm/layer18": 8.699337124824524, + "mean_norm/layer19": 8.701597511768341, + "mean_norm/layer2": 8.277015924453735, + "mean_norm/layer20": 8.768545150756836, + "mean_norm/layer21": 8.749671161174774, + "mean_norm/layer22": 8.995070099830627, + "mean_norm/layer23": 9.001830399036407, + "mean_norm/layer3": 8.898363590240479, + "mean_norm/layer4": 8.62207943201065, + "mean_norm/layer5": 9.221762597560883, + "mean_norm/layer6": 8.477177321910858, + "mean_norm/layer7": 8.626116931438446, + "mean_norm/layer8": 8.743105173110962, + "mean_norm/layer9": 8.731046319007874, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 1650 + }, + { + "epoch": 0.69, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4328169933845212, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.9699418544769287, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7962, + "eval_samples_per_second": 20.43, + "eval_steps_per_second": 0.678, + "step": 1650 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.71, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.0322, + "max_norm": 13.67343807220459, + "max_norm/layer0": 12.717508316040039, + "max_norm/layer1": 13.026078224182129, + "max_norm/layer10": 13.373031616210938, + "max_norm/layer11": 12.978168487548828, + "max_norm/layer12": 13.207404136657715, + "max_norm/layer13": 12.527669906616211, + "max_norm/layer14": 13.306821823120117, + "max_norm/layer15": 13.35703182220459, + "max_norm/layer16": 12.5789155960083, + "max_norm/layer17": 13.446418762207031, + "max_norm/layer18": 12.62332534790039, + "max_norm/layer19": 12.609963417053223, + "max_norm/layer2": 12.068394660949707, + "max_norm/layer20": 13.062036514282227, + "max_norm/layer21": 12.836729049682617, + "max_norm/layer22": 13.222061157226562, + "max_norm/layer23": 13.132906913757324, + "max_norm/layer3": 12.828428268432617, + "max_norm/layer4": 12.867692947387695, + "max_norm/layer5": 13.67343807220459, + "max_norm/layer6": 12.808048248291016, + "max_norm/layer7": 13.316970825195312, + "max_norm/layer8": 13.244258880615234, + "max_norm/layer9": 13.288371086120605, + "mean_norm": 8.769363696376482, + "mean_norm/layer0": 8.536643624305725, + "mean_norm/layer1": 8.581710577011108, + "mean_norm/layer10": 8.76716548204422, + "mean_norm/layer11": 8.841660916805267, + "mean_norm/layer12": 8.917559087276459, + "mean_norm/layer13": 8.706561088562012, + "mean_norm/layer14": 8.82697319984436, + "mean_norm/layer15": 8.910794138908386, + "mean_norm/layer16": 8.71890926361084, + "mean_norm/layer17": 8.8657585978508, + "mean_norm/layer18": 8.72101479768753, + "mean_norm/layer19": 8.723503530025482, + "mean_norm/layer2": 8.282784938812256, + "mean_norm/layer20": 8.791405975818634, + "mean_norm/layer21": 8.771677851676941, + "mean_norm/layer22": 9.024154126644135, + "mean_norm/layer23": 9.02972674369812, + "mean_norm/layer3": 8.919883489608765, + "mean_norm/layer4": 8.636090219020844, + "mean_norm/layer5": 9.252493143081665, + "mean_norm/layer6": 8.487660467624664, + "mean_norm/layer7": 8.640743553638458, + "mean_norm/layer8": 8.761323869228363, + "mean_norm/layer9": 8.74853003025055, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 1700 + }, + { + "epoch": 0.71, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.43344974304685185, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.96112060546875, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5347, + "eval_samples_per_second": 20.893, + "eval_steps_per_second": 0.694, + "step": 1700 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.73, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.0316, + "max_norm": 13.7894926071167, + "max_norm/layer0": 12.797962188720703, + "max_norm/layer1": 13.098018646240234, + "max_norm/layer10": 13.477941513061523, + "max_norm/layer11": 13.097651481628418, + "max_norm/layer12": 13.281977653503418, + "max_norm/layer13": 12.603769302368164, + "max_norm/layer14": 13.395450592041016, + "max_norm/layer15": 13.554838180541992, + "max_norm/layer16": 12.664692878723145, + "max_norm/layer17": 13.577613830566406, + "max_norm/layer18": 12.694923400878906, + "max_norm/layer19": 12.688633918762207, + "max_norm/layer2": 12.093019485473633, + "max_norm/layer20": 13.206803321838379, + "max_norm/layer21": 12.924551010131836, + "max_norm/layer22": 13.276300430297852, + "max_norm/layer23": 13.243668556213379, + "max_norm/layer3": 12.960731506347656, + "max_norm/layer4": 12.94802188873291, + "max_norm/layer5": 13.7894926071167, + "max_norm/layer6": 12.89012622833252, + "max_norm/layer7": 13.404141426086426, + "max_norm/layer8": 13.369832038879395, + "max_norm/layer9": 13.391281127929688, + "mean_norm": 8.78863892952601, + "mean_norm/layer0": 8.54848575592041, + "mean_norm/layer1": 8.595603168010712, + "mean_norm/layer10": 8.785156428813934, + "mean_norm/layer11": 8.8616703748703, + "mean_norm/layer12": 8.941543579101562, + "mean_norm/layer13": 8.724583804607391, + "mean_norm/layer14": 8.848139107227325, + "mean_norm/layer15": 8.934328258037567, + "mean_norm/layer16": 8.738065421581268, + "mean_norm/layer17": 8.889622032642365, + "mean_norm/layer18": 8.742164075374603, + "mean_norm/layer19": 8.744739770889282, + "mean_norm/layer2": 8.288312077522278, + "mean_norm/layer20": 8.814082443714142, + "mean_norm/layer21": 8.792964518070221, + "mean_norm/layer22": 9.052066385746002, + "mean_norm/layer23": 9.05666446685791, + "mean_norm/layer3": 8.940515279769897, + "mean_norm/layer4": 8.64976292848587, + "mean_norm/layer5": 9.281967520713806, + "mean_norm/layer6": 8.497880458831787, + "mean_norm/layer7": 8.654960215091705, + "mean_norm/layer8": 8.778730392456055, + "mean_norm/layer9": 8.765325844287872, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 1750 + }, + { + "epoch": 0.73, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.43388374441780947, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.9500808715820312, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.803, + "eval_samples_per_second": 20.419, + "eval_steps_per_second": 0.678, + "step": 1750 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.75, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.02, + "max_norm": 13.906452178955078, + "max_norm/layer0": 12.882908821105957, + "max_norm/layer1": 13.187368392944336, + "max_norm/layer10": 13.588659286499023, + "max_norm/layer11": 13.258871078491211, + "max_norm/layer12": 13.408331871032715, + "max_norm/layer13": 12.65833568572998, + "max_norm/layer14": 13.496163368225098, + "max_norm/layer15": 13.707235336303711, + "max_norm/layer16": 12.777694702148438, + "max_norm/layer17": 13.714956283569336, + "max_norm/layer18": 12.791309356689453, + "max_norm/layer19": 12.784247398376465, + "max_norm/layer2": 12.128005027770996, + "max_norm/layer20": 13.322413444519043, + "max_norm/layer21": 13.02280330657959, + "max_norm/layer22": 13.338006973266602, + "max_norm/layer23": 13.346099853515625, + "max_norm/layer3": 13.023100852966309, + "max_norm/layer4": 13.038986206054688, + "max_norm/layer5": 13.906452178955078, + "max_norm/layer6": 13.03666877746582, + "max_norm/layer7": 13.498882293701172, + "max_norm/layer8": 13.546557426452637, + "max_norm/layer9": 13.48300552368164, + "mean_norm": 8.807754442095757, + "mean_norm/layer0": 8.560234010219574, + "mean_norm/layer1": 8.609053313732147, + "mean_norm/layer10": 8.802674889564514, + "mean_norm/layer11": 8.881379961967468, + "mean_norm/layer12": 8.965039670467377, + "mean_norm/layer13": 8.74233728647232, + "mean_norm/layer14": 8.869293451309204, + "mean_norm/layer15": 8.957258760929108, + "mean_norm/layer16": 8.757313013076782, + "mean_norm/layer17": 8.913440644741058, + "mean_norm/layer18": 8.763157367706299, + "mean_norm/layer19": 8.765839517116547, + "mean_norm/layer2": 8.293516039848328, + "mean_norm/layer20": 8.836040437221527, + "mean_norm/layer21": 8.81434577703476, + "mean_norm/layer22": 9.0809645652771, + "mean_norm/layer23": 9.083868980407715, + "mean_norm/layer3": 8.96069985628128, + "mean_norm/layer4": 8.663160383701324, + "mean_norm/layer5": 9.310991764068604, + "mean_norm/layer6": 8.508190274238586, + "mean_norm/layer7": 8.669151663780212, + "mean_norm/layer8": 8.796195685863495, + "mean_norm/layer9": 8.781959295272827, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 1800 + }, + { + "epoch": 0.75, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.43465034497024857, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.9467976093292236, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5398, + "eval_samples_per_second": 20.884, + "eval_steps_per_second": 0.693, + "step": 1800 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.77, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.0245, + "max_norm": 14.01785659790039, + "max_norm/layer0": 12.971237182617188, + "max_norm/layer1": 13.28554630279541, + "max_norm/layer10": 13.687850952148438, + "max_norm/layer11": 13.372243881225586, + "max_norm/layer12": 13.521031379699707, + "max_norm/layer13": 12.716824531555176, + "max_norm/layer14": 13.601958274841309, + "max_norm/layer15": 13.830903053283691, + "max_norm/layer16": 12.890148162841797, + "max_norm/layer17": 13.841341018676758, + "max_norm/layer18": 12.844350814819336, + "max_norm/layer19": 12.881791114807129, + "max_norm/layer2": 12.16059398651123, + "max_norm/layer20": 13.44249439239502, + "max_norm/layer21": 13.136921882629395, + "max_norm/layer22": 13.400025367736816, + "max_norm/layer23": 13.452230453491211, + "max_norm/layer3": 13.076272010803223, + "max_norm/layer4": 13.150069236755371, + "max_norm/layer5": 14.01785659790039, + "max_norm/layer6": 13.116811752319336, + "max_norm/layer7": 13.590741157531738, + "max_norm/layer8": 13.703124046325684, + "max_norm/layer9": 13.586084365844727, + "mean_norm": 8.82675089687109, + "mean_norm/layer0": 8.572085976600647, + "mean_norm/layer1": 8.62241667509079, + "mean_norm/layer10": 8.82029390335083, + "mean_norm/layer11": 8.901059448719025, + "mean_norm/layer12": 8.988628685474396, + "mean_norm/layer13": 8.75994199514389, + "mean_norm/layer14": 8.890415966510773, + "mean_norm/layer15": 8.980129182338715, + "mean_norm/layer16": 8.776431798934937, + "mean_norm/layer17": 8.936899721622467, + "mean_norm/layer18": 8.784013092517853, + "mean_norm/layer19": 8.786966979503632, + "mean_norm/layer2": 8.298439383506775, + "mean_norm/layer20": 8.858497023582458, + "mean_norm/layer21": 8.83534300327301, + "mean_norm/layer22": 9.109531104564667, + "mean_norm/layer23": 9.110761523246765, + "mean_norm/layer3": 8.980851411819458, + "mean_norm/layer4": 8.676248848438263, + "mean_norm/layer5": 9.340028464794159, + "mean_norm/layer6": 8.518348813056946, + "mean_norm/layer7": 8.682745039463043, + "mean_norm/layer8": 8.81353086233139, + "mean_norm/layer9": 8.79841262102127, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 1850 + }, + { + "epoch": 0.77, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4355183477121638, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.940542697906494, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8237, + "eval_samples_per_second": 20.383, + "eval_steps_per_second": 0.677, + "step": 1850 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.79, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.0247, + "max_norm": 14.138656616210938, + "max_norm/layer0": 13.052218437194824, + "max_norm/layer1": 13.381721496582031, + "max_norm/layer10": 13.791936874389648, + "max_norm/layer11": 13.474544525146484, + "max_norm/layer12": 13.667418479919434, + "max_norm/layer13": 12.79587459564209, + "max_norm/layer14": 13.703073501586914, + "max_norm/layer15": 13.987411499023438, + "max_norm/layer16": 12.992448806762695, + "max_norm/layer17": 13.965337753295898, + "max_norm/layer18": 12.948287010192871, + "max_norm/layer19": 12.983268737792969, + "max_norm/layer2": 12.176477432250977, + "max_norm/layer20": 13.5822172164917, + "max_norm/layer21": 13.263895034790039, + "max_norm/layer22": 13.479641914367676, + "max_norm/layer23": 13.553653717041016, + "max_norm/layer3": 13.128030776977539, + "max_norm/layer4": 13.215946197509766, + "max_norm/layer5": 14.138656616210938, + "max_norm/layer6": 13.19811725616455, + "max_norm/layer7": 13.667899131774902, + "max_norm/layer8": 13.788747787475586, + "max_norm/layer9": 13.685811996459961, + "mean_norm": 8.845184216896692, + "mean_norm/layer0": 8.5836620926857, + "mean_norm/layer1": 8.635238826274872, + "mean_norm/layer10": 8.837403535842896, + "mean_norm/layer11": 8.920144736766815, + "mean_norm/layer12": 9.011907458305359, + "mean_norm/layer13": 8.777201354503632, + "mean_norm/layer14": 8.910749077796936, + "mean_norm/layer15": 9.002386212348938, + "mean_norm/layer16": 8.794780671596527, + "mean_norm/layer17": 8.959879457950592, + "mean_norm/layer18": 8.804102182388306, + "mean_norm/layer19": 8.807617962360382, + "mean_norm/layer2": 8.303315997123718, + "mean_norm/layer20": 8.88015216588974, + "mean_norm/layer21": 8.855957210063934, + "mean_norm/layer22": 9.13687926530838, + "mean_norm/layer23": 9.136677742004395, + "mean_norm/layer3": 9.000433564186096, + "mean_norm/layer4": 8.689013838768005, + "mean_norm/layer5": 9.368463218212128, + "mean_norm/layer6": 8.527889966964722, + "mean_norm/layer7": 8.695912837982178, + "mean_norm/layer8": 8.830221474170685, + "mean_norm/layer9": 8.814430356025696, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 1900 + }, + { + "epoch": 0.79, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.436199770425443, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.9340319633483887, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5963, + "eval_samples_per_second": 20.782, + "eval_steps_per_second": 0.69, + "step": 1900 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.81, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.0201, + "max_norm": 14.271653175354004, + "max_norm/layer0": 13.13520622253418, + "max_norm/layer1": 13.476064682006836, + "max_norm/layer10": 13.901469230651855, + "max_norm/layer11": 13.575247764587402, + "max_norm/layer12": 13.7691650390625, + "max_norm/layer13": 12.850029945373535, + "max_norm/layer14": 13.810707092285156, + "max_norm/layer15": 14.146288871765137, + "max_norm/layer16": 13.090737342834473, + "max_norm/layer17": 14.088882446289062, + "max_norm/layer18": 13.102824211120605, + "max_norm/layer19": 13.057214736938477, + "max_norm/layer2": 12.24477767944336, + "max_norm/layer20": 13.693897247314453, + "max_norm/layer21": 13.370636940002441, + "max_norm/layer22": 13.551177978515625, + "max_norm/layer23": 13.672248840332031, + "max_norm/layer3": 13.1995267868042, + "max_norm/layer4": 13.299997329711914, + "max_norm/layer5": 14.271653175354004, + "max_norm/layer6": 13.269554138183594, + "max_norm/layer7": 13.732311248779297, + "max_norm/layer8": 13.88916015625, + "max_norm/layer9": 13.77952766418457, + "mean_norm": 8.863051029543081, + "mean_norm/layer0": 8.594872176647186, + "mean_norm/layer1": 8.648047864437103, + "mean_norm/layer10": 8.853616833686829, + "mean_norm/layer11": 8.938627779483795, + "mean_norm/layer12": 9.034486055374146, + "mean_norm/layer13": 8.793805718421936, + "mean_norm/layer14": 8.930472075939178, + "mean_norm/layer15": 9.02397906780243, + "mean_norm/layer16": 8.81262332201004, + "mean_norm/layer17": 8.982100486755371, + "mean_norm/layer18": 8.823445796966553, + "mean_norm/layer19": 8.827480673789978, + "mean_norm/layer2": 8.308004558086395, + "mean_norm/layer20": 8.901043772697449, + "mean_norm/layer21": 8.875850260257721, + "mean_norm/layer22": 9.163272619247437, + "mean_norm/layer23": 9.16199541091919, + "mean_norm/layer3": 9.019525945186615, + "mean_norm/layer4": 8.701404392719269, + "mean_norm/layer5": 9.396052300930023, + "mean_norm/layer6": 8.537376403808594, + "mean_norm/layer7": 8.708706319332123, + "mean_norm/layer8": 8.846332848072052, + "mean_norm/layer9": 8.830102026462555, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 1950 + }, + { + "epoch": 0.81, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4370839975176744, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.9285225868225098, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8013, + "eval_samples_per_second": 20.421, + "eval_steps_per_second": 0.678, + "step": 1950 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.84, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.0107, + "max_norm": 14.383659362792969, + "max_norm/layer0": 13.219470977783203, + "max_norm/layer1": 13.575953483581543, + "max_norm/layer10": 14.011261940002441, + "max_norm/layer11": 13.69066333770752, + "max_norm/layer12": 13.898682594299316, + "max_norm/layer13": 12.897134780883789, + "max_norm/layer14": 13.895804405212402, + "max_norm/layer15": 14.285606384277344, + "max_norm/layer16": 13.165793418884277, + "max_norm/layer17": 14.2105712890625, + "max_norm/layer18": 13.221928596496582, + "max_norm/layer19": 13.153519630432129, + "max_norm/layer2": 12.27010440826416, + "max_norm/layer20": 13.807734489440918, + "max_norm/layer21": 13.467498779296875, + "max_norm/layer22": 13.61931324005127, + "max_norm/layer23": 13.794743537902832, + "max_norm/layer3": 13.270720481872559, + "max_norm/layer4": 13.370405197143555, + "max_norm/layer5": 14.383659362792969, + "max_norm/layer6": 13.332939147949219, + "max_norm/layer7": 13.822017669677734, + "max_norm/layer8": 13.997716903686523, + "max_norm/layer9": 13.877385139465332, + "mean_norm": 8.880738290647665, + "mean_norm/layer0": 8.60589337348938, + "mean_norm/layer1": 8.660571813583374, + "mean_norm/layer10": 8.86993956565857, + "mean_norm/layer11": 8.956714928150177, + "mean_norm/layer12": 9.056580424308777, + "mean_norm/layer13": 8.810520350933075, + "mean_norm/layer14": 8.950220763683319, + "mean_norm/layer15": 9.045172274112701, + "mean_norm/layer16": 8.83077585697174, + "mean_norm/layer17": 9.004396915435791, + "mean_norm/layer18": 8.842631757259369, + "mean_norm/layer19": 8.847141087055206, + "mean_norm/layer2": 8.312703967094421, + "mean_norm/layer20": 8.92222511768341, + "mean_norm/layer21": 8.895317256450653, + "mean_norm/layer22": 9.189109563827515, + "mean_norm/layer23": 9.187323927879333, + "mean_norm/layer3": 9.038133919239044, + "mean_norm/layer4": 8.713449716567993, + "mean_norm/layer5": 9.423080027103424, + "mean_norm/layer6": 8.546690106391907, + "mean_norm/layer7": 8.72130572795868, + "mean_norm/layer8": 8.862245798110962, + "mean_norm/layer9": 8.845574736595154, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 2000 + }, + { + "epoch": 0.84, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.43821158986464837, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.9188804626464844, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7928, + "eval_samples_per_second": 20.436, + "eval_steps_per_second": 0.678, + "step": 2000 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.86, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 3.003, + "max_norm": 14.526294708251953, + "max_norm/layer0": 13.318120956420898, + "max_norm/layer1": 13.691896438598633, + "max_norm/layer10": 14.119477272033691, + "max_norm/layer11": 13.802632331848145, + "max_norm/layer12": 13.983503341674805, + "max_norm/layer13": 12.947667121887207, + "max_norm/layer14": 14.012450218200684, + "max_norm/layer15": 14.473040580749512, + "max_norm/layer16": 13.238360404968262, + "max_norm/layer17": 14.329521179199219, + "max_norm/layer18": 13.304075241088867, + "max_norm/layer19": 13.220603942871094, + "max_norm/layer2": 12.33705997467041, + "max_norm/layer20": 13.91451358795166, + "max_norm/layer21": 13.595061302185059, + "max_norm/layer22": 13.679491996765137, + "max_norm/layer23": 13.914533615112305, + "max_norm/layer3": 13.341594696044922, + "max_norm/layer4": 13.453817367553711, + "max_norm/layer5": 14.526294708251953, + "max_norm/layer6": 13.413007736206055, + "max_norm/layer7": 13.901131629943848, + "max_norm/layer8": 14.125232696533203, + "max_norm/layer9": 13.965437889099121, + "mean_norm": 8.898506715893745, + "mean_norm/layer0": 8.61709862947464, + "mean_norm/layer1": 8.673097789287567, + "mean_norm/layer10": 8.886326968669891, + "mean_norm/layer11": 8.975116968154907, + "mean_norm/layer12": 9.078686237335205, + "mean_norm/layer13": 8.826960861682892, + "mean_norm/layer14": 8.969876110553741, + "mean_norm/layer15": 9.066643118858337, + "mean_norm/layer16": 8.848939836025238, + "mean_norm/layer17": 9.026445209980011, + "mean_norm/layer18": 8.862169206142426, + "mean_norm/layer19": 8.867026507854462, + "mean_norm/layer2": 8.317440271377563, + "mean_norm/layer20": 8.943169057369232, + "mean_norm/layer21": 8.91546756029129, + "mean_norm/layer22": 9.215493023395538, + "mean_norm/layer23": 9.21242493391037, + "mean_norm/layer3": 9.056794881820679, + "mean_norm/layer4": 8.725628674030304, + "mean_norm/layer5": 9.450334191322327, + "mean_norm/layer6": 8.556267082691193, + "mean_norm/layer7": 8.733982026576996, + "mean_norm/layer8": 8.878000140190125, + "mean_norm/layer9": 8.860771894454956, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 2050 + }, + { + "epoch": 0.86, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.43880377865118864, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.9210426807403564, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8044, + "eval_samples_per_second": 20.416, + "eval_steps_per_second": 0.678, + "step": 2050 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.88, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.9918, + "max_norm": 14.670685768127441, + "max_norm/layer0": 13.415691375732422, + "max_norm/layer1": 13.807945251464844, + "max_norm/layer10": 14.238808631896973, + "max_norm/layer11": 13.896550178527832, + "max_norm/layer12": 14.093559265136719, + "max_norm/layer13": 13.039774894714355, + "max_norm/layer14": 14.146052360534668, + "max_norm/layer15": 14.658995628356934, + "max_norm/layer16": 13.320241928100586, + "max_norm/layer17": 14.467944145202637, + "max_norm/layer18": 13.421971321105957, + "max_norm/layer19": 13.300816535949707, + "max_norm/layer2": 12.368851661682129, + "max_norm/layer20": 14.032940864562988, + "max_norm/layer21": 13.714327812194824, + "max_norm/layer22": 13.763936996459961, + "max_norm/layer23": 14.012027740478516, + "max_norm/layer3": 13.413012504577637, + "max_norm/layer4": 13.571505546569824, + "max_norm/layer5": 14.670685768127441, + "max_norm/layer6": 13.480942726135254, + "max_norm/layer7": 13.977544784545898, + "max_norm/layer8": 14.206221580505371, + "max_norm/layer9": 14.046436309814453, + "mean_norm": 8.915782399475574, + "mean_norm/layer0": 8.628024458885193, + "mean_norm/layer1": 8.685210585594177, + "mean_norm/layer10": 8.902346730232239, + "mean_norm/layer11": 8.993071556091309, + "mean_norm/layer12": 9.100186705589294, + "mean_norm/layer13": 8.842869818210602, + "mean_norm/layer14": 8.988996028900146, + "mean_norm/layer15": 9.087421298027039, + "mean_norm/layer16": 8.86632490158081, + "mean_norm/layer17": 9.047946333885193, + "mean_norm/layer18": 8.881589412689209, + "mean_norm/layer19": 8.886434435844421, + "mean_norm/layer2": 8.321897983551025, + "mean_norm/layer20": 8.96368944644928, + "mean_norm/layer21": 8.934747517108917, + "mean_norm/layer22": 9.241970539093018, + "mean_norm/layer23": 9.237237215042114, + "mean_norm/layer3": 9.074563026428223, + "mean_norm/layer4": 8.737144529819489, + "mean_norm/layer5": 9.476523578166962, + "mean_norm/layer6": 8.56508320569992, + "mean_norm/layer7": 8.74627560377121, + "mean_norm/layer8": 8.893504977226257, + "mean_norm/layer9": 8.87571769952774, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 2100 + }, + { + "epoch": 0.88, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.43886867605245333, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.909998893737793, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7897, + "eval_samples_per_second": 20.442, + "eval_steps_per_second": 0.679, + "step": 2100 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.9, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.9853, + "max_norm": 14.838692665100098, + "max_norm/layer0": 13.50354290008545, + "max_norm/layer1": 13.911642074584961, + "max_norm/layer10": 14.337469100952148, + "max_norm/layer11": 13.996798515319824, + "max_norm/layer12": 14.188272476196289, + "max_norm/layer13": 13.153363227844238, + "max_norm/layer14": 14.2456693649292, + "max_norm/layer15": 14.81822681427002, + "max_norm/layer16": 13.398094177246094, + "max_norm/layer17": 14.58063793182373, + "max_norm/layer18": 13.529489517211914, + "max_norm/layer19": 13.36036491394043, + "max_norm/layer2": 12.395270347595215, + "max_norm/layer20": 14.136859893798828, + "max_norm/layer21": 13.848156929016113, + "max_norm/layer22": 13.873931884765625, + "max_norm/layer23": 14.149714469909668, + "max_norm/layer3": 13.486695289611816, + "max_norm/layer4": 13.675530433654785, + "max_norm/layer5": 14.838692665100098, + "max_norm/layer6": 13.546252250671387, + "max_norm/layer7": 14.067277908325195, + "max_norm/layer8": 14.312942504882812, + "max_norm/layer9": 14.15059757232666, + "mean_norm": 8.9328340391318, + "mean_norm/layer0": 8.638837158679962, + "mean_norm/layer1": 8.69721806049347, + "mean_norm/layer10": 8.91822373867035, + "mean_norm/layer11": 9.010710537433624, + "mean_norm/layer12": 9.121225714683533, + "mean_norm/layer13": 8.85855746269226, + "mean_norm/layer14": 9.007853507995605, + "mean_norm/layer15": 9.107969760894775, + "mean_norm/layer16": 8.883861780166626, + "mean_norm/layer17": 9.06923532485962, + "mean_norm/layer18": 8.90061503648758, + "mean_norm/layer19": 8.905701696872711, + "mean_norm/layer2": 8.326269209384918, + "mean_norm/layer20": 8.983186781406403, + "mean_norm/layer21": 8.953919172286987, + "mean_norm/layer22": 9.268231928348541, + "mean_norm/layer23": 9.26182246208191, + "mean_norm/layer3": 9.09225046634674, + "mean_norm/layer4": 8.748473942279816, + "mean_norm/layer5": 9.502384603023529, + "mean_norm/layer6": 8.573933243751526, + "mean_norm/layer7": 8.758572161197662, + "mean_norm/layer8": 8.908560156822205, + "mean_norm/layer9": 8.890403032302856, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 2150 + }, + { + "epoch": 0.9, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4398867540347931, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.901756763458252, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8028, + "eval_samples_per_second": 20.419, + "eval_steps_per_second": 0.678, + "step": 2150 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.92, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.9923, + "max_norm": 14.992657661437988, + "max_norm/layer0": 13.580909729003906, + "max_norm/layer1": 14.019521713256836, + "max_norm/layer10": 14.454727172851562, + "max_norm/layer11": 14.117258071899414, + "max_norm/layer12": 14.273975372314453, + "max_norm/layer13": 13.259902000427246, + "max_norm/layer14": 14.327220916748047, + "max_norm/layer15": 14.929570198059082, + "max_norm/layer16": 13.4490385055542, + "max_norm/layer17": 14.68906021118164, + "max_norm/layer18": 13.657282829284668, + "max_norm/layer19": 13.454545974731445, + "max_norm/layer2": 12.426871299743652, + "max_norm/layer20": 14.252646446228027, + "max_norm/layer21": 13.96719741821289, + "max_norm/layer22": 14.019536018371582, + "max_norm/layer23": 14.235506057739258, + "max_norm/layer3": 13.598733901977539, + "max_norm/layer4": 13.746255874633789, + "max_norm/layer5": 14.992657661437988, + "max_norm/layer6": 13.630704879760742, + "max_norm/layer7": 14.18418025970459, + "max_norm/layer8": 14.406624794006348, + "max_norm/layer9": 14.30229377746582, + "mean_norm": 8.949172087013721, + "mean_norm/layer0": 8.649221539497375, + "mean_norm/layer1": 8.708901345729828, + "mean_norm/layer10": 8.93329781293869, + "mean_norm/layer11": 9.027457654476166, + "mean_norm/layer12": 9.141777276992798, + "mean_norm/layer13": 8.873935222625732, + "mean_norm/layer14": 9.02572363615036, + "mean_norm/layer15": 9.127559781074524, + "mean_norm/layer16": 8.90040373802185, + "mean_norm/layer17": 9.089453399181366, + "mean_norm/layer18": 8.918771147727966, + "mean_norm/layer19": 8.924110770225525, + "mean_norm/layer2": 8.330630600452423, + "mean_norm/layer20": 9.002286434173584, + "mean_norm/layer21": 8.972177803516388, + "mean_norm/layer22": 9.292498588562012, + "mean_norm/layer23": 9.28546392917633, + "mean_norm/layer3": 9.109552025794983, + "mean_norm/layer4": 8.759545028209686, + "mean_norm/layer5": 9.527128338813782, + "mean_norm/layer6": 8.582504987716675, + "mean_norm/layer7": 8.770052433013916, + "mean_norm/layer8": 8.923248827457428, + "mean_norm/layer9": 8.904427766799927, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 2200 + }, + { + "epoch": 0.92, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4405722328356514, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.899564027786255, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7906, + "eval_samples_per_second": 20.44, + "eval_steps_per_second": 0.679, + "step": 2200 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.94, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.9791, + "max_norm": 15.16025447845459, + "max_norm/layer0": 13.65170955657959, + "max_norm/layer1": 14.106208801269531, + "max_norm/layer10": 14.575181007385254, + "max_norm/layer11": 14.219459533691406, + "max_norm/layer12": 14.364925384521484, + "max_norm/layer13": 13.383106231689453, + "max_norm/layer14": 14.4501314163208, + "max_norm/layer15": 14.990113258361816, + "max_norm/layer16": 13.513087272644043, + "max_norm/layer17": 14.812724113464355, + "max_norm/layer18": 13.795426368713379, + "max_norm/layer19": 13.57463264465332, + "max_norm/layer2": 12.443663597106934, + "max_norm/layer20": 14.366467475891113, + "max_norm/layer21": 14.078028678894043, + "max_norm/layer22": 14.125088691711426, + "max_norm/layer23": 14.330960273742676, + "max_norm/layer3": 13.687296867370605, + "max_norm/layer4": 13.831295013427734, + "max_norm/layer5": 15.16025447845459, + "max_norm/layer6": 13.669600486755371, + "max_norm/layer7": 14.281567573547363, + "max_norm/layer8": 14.49099349975586, + "max_norm/layer9": 14.393123626708984, + "mean_norm": 8.96567795674006, + "mean_norm/layer0": 8.65979665517807, + "mean_norm/layer1": 8.720866560935974, + "mean_norm/layer10": 8.948398649692535, + "mean_norm/layer11": 9.044549465179443, + "mean_norm/layer12": 9.16236698627472, + "mean_norm/layer13": 8.88937371969223, + "mean_norm/layer14": 9.043819427490234, + "mean_norm/layer15": 9.147380352020264, + "mean_norm/layer16": 8.91715395450592, + "mean_norm/layer17": 9.10979026556015, + "mean_norm/layer18": 8.93702483177185, + "mean_norm/layer19": 8.943160235881805, + "mean_norm/layer2": 8.334900140762329, + "mean_norm/layer20": 9.021081447601318, + "mean_norm/layer21": 8.991265833377838, + "mean_norm/layer22": 9.317129492759705, + "mean_norm/layer23": 9.309127569198608, + "mean_norm/layer3": 9.127320051193237, + "mean_norm/layer4": 8.770549535751343, + "mean_norm/layer5": 9.552104949951172, + "mean_norm/layer6": 8.59102463722229, + "mean_norm/layer7": 8.781688511371613, + "mean_norm/layer8": 8.938059091567993, + "mean_norm/layer9": 8.918338596820831, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 2250 + }, + { + "epoch": 0.94, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4413428894756696, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.900628089904785, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8107, + "eval_samples_per_second": 20.405, + "eval_steps_per_second": 0.677, + "step": 2250 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.96, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.9806, + "max_norm": 15.3043851852417, + "max_norm/layer0": 13.725802421569824, + "max_norm/layer1": 14.185372352600098, + "max_norm/layer10": 14.689973831176758, + "max_norm/layer11": 14.349565505981445, + "max_norm/layer12": 14.45600700378418, + "max_norm/layer13": 13.499764442443848, + "max_norm/layer14": 14.550609588623047, + "max_norm/layer15": 15.10234546661377, + "max_norm/layer16": 13.573525428771973, + "max_norm/layer17": 14.938157081604004, + "max_norm/layer18": 13.935149192810059, + "max_norm/layer19": 13.665972709655762, + "max_norm/layer2": 12.481348037719727, + "max_norm/layer20": 14.470271110534668, + "max_norm/layer21": 14.191650390625, + "max_norm/layer22": 14.222891807556152, + "max_norm/layer23": 14.447844505310059, + "max_norm/layer3": 13.801197052001953, + "max_norm/layer4": 13.936980247497559, + "max_norm/layer5": 15.3043851852417, + "max_norm/layer6": 13.723240852355957, + "max_norm/layer7": 14.402823448181152, + "max_norm/layer8": 14.585365295410156, + "max_norm/layer9": 14.490229606628418, + "mean_norm": 8.982164661089579, + "mean_norm/layer0": 8.670240640640259, + "mean_norm/layer1": 8.732674479484558, + "mean_norm/layer10": 8.963507533073425, + "mean_norm/layer11": 9.06149274110794, + "mean_norm/layer12": 9.183135092258453, + "mean_norm/layer13": 8.904652893543243, + "mean_norm/layer14": 9.061905086040497, + "mean_norm/layer15": 9.167264759540558, + "mean_norm/layer16": 8.934041142463684, + "mean_norm/layer17": 9.130063891410828, + "mean_norm/layer18": 8.95542061328888, + "mean_norm/layer19": 8.962070345878601, + "mean_norm/layer2": 8.339269459247589, + "mean_norm/layer20": 9.040118932723999, + "mean_norm/layer21": 9.009513676166534, + "mean_norm/layer22": 9.341909527778625, + "mean_norm/layer23": 9.333087861537933, + "mean_norm/layer3": 9.14510715007782, + "mean_norm/layer4": 8.781482458114624, + "mean_norm/layer5": 9.576900124549866, + "mean_norm/layer6": 8.599566221237183, + "mean_norm/layer7": 8.79344254732132, + "mean_norm/layer8": 8.95266330242157, + "mean_norm/layer9": 8.932421386241913, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 2300 + }, + { + "epoch": 0.96, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4420364804516859, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.8937957286834717, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7988, + "eval_samples_per_second": 20.426, + "eval_steps_per_second": 0.678, + "step": 2300 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 0.98, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.9658, + "max_norm": 15.441264152526855, + "max_norm/layer0": 13.801191329956055, + "max_norm/layer1": 14.290616989135742, + "max_norm/layer10": 14.793299674987793, + "max_norm/layer11": 14.459893226623535, + "max_norm/layer12": 14.546797752380371, + "max_norm/layer13": 13.60170841217041, + "max_norm/layer14": 14.642404556274414, + "max_norm/layer15": 15.176553726196289, + "max_norm/layer16": 13.654974937438965, + "max_norm/layer17": 15.051509857177734, + "max_norm/layer18": 14.04863166809082, + "max_norm/layer19": 13.769092559814453, + "max_norm/layer2": 12.504697799682617, + "max_norm/layer20": 14.588030815124512, + "max_norm/layer21": 14.302506446838379, + "max_norm/layer22": 14.334789276123047, + "max_norm/layer23": 14.561293601989746, + "max_norm/layer3": 13.900928497314453, + "max_norm/layer4": 14.038566589355469, + "max_norm/layer5": 15.441264152526855, + "max_norm/layer6": 13.786172866821289, + "max_norm/layer7": 14.514456748962402, + "max_norm/layer8": 14.683159828186035, + "max_norm/layer9": 14.579593658447266, + "mean_norm": 8.998664572834969, + "mean_norm/layer0": 8.680808067321777, + "mean_norm/layer1": 8.744622588157654, + "mean_norm/layer10": 8.978585541248322, + "mean_norm/layer11": 9.078620612621307, + "mean_norm/layer12": 9.203763127326965, + "mean_norm/layer13": 8.91998440027237, + "mean_norm/layer14": 9.07971066236496, + "mean_norm/layer15": 9.186996579170227, + "mean_norm/layer16": 8.95055615901947, + "mean_norm/layer17": 9.15077942609787, + "mean_norm/layer18": 8.973953247070312, + "mean_norm/layer19": 8.980820953845978, + "mean_norm/layer2": 8.34368771314621, + "mean_norm/layer20": 9.059822857379913, + "mean_norm/layer21": 9.02804982662201, + "mean_norm/layer22": 9.366870760917664, + "mean_norm/layer23": 9.357110679149628, + "mean_norm/layer3": 9.162328720092773, + "mean_norm/layer4": 8.792425751686096, + "mean_norm/layer5": 9.601547956466675, + "mean_norm/layer6": 8.608037114143372, + "mean_norm/layer7": 8.804958939552307, + "mean_norm/layer8": 8.967408537864685, + "mean_norm/layer9": 8.946499526500702, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 2350 + }, + { + "epoch": 0.98, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.44169982518262535, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.8900845050811768, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5515, + "eval_samples_per_second": 20.863, + "eval_steps_per_second": 0.693, + "step": 2350 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.0, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.9577, + "max_norm": 15.574953079223633, + "max_norm/layer0": 13.878785133361816, + "max_norm/layer1": 14.37764835357666, + "max_norm/layer10": 14.902111053466797, + "max_norm/layer11": 14.557250022888184, + "max_norm/layer12": 14.682308197021484, + "max_norm/layer13": 13.673648834228516, + "max_norm/layer14": 14.743877410888672, + "max_norm/layer15": 15.239487648010254, + "max_norm/layer16": 13.727298736572266, + "max_norm/layer17": 15.168072700500488, + "max_norm/layer18": 14.170589447021484, + "max_norm/layer19": 13.88883113861084, + "max_norm/layer2": 12.54202938079834, + "max_norm/layer20": 14.685086250305176, + "max_norm/layer21": 14.394617080688477, + "max_norm/layer22": 14.45186710357666, + "max_norm/layer23": 14.659900665283203, + "max_norm/layer3": 13.987744331359863, + "max_norm/layer4": 14.10349178314209, + "max_norm/layer5": 15.574953079223633, + "max_norm/layer6": 13.852619171142578, + "max_norm/layer7": 14.626072883605957, + "max_norm/layer8": 14.781867027282715, + "max_norm/layer9": 14.68445110321045, + "mean_norm": 9.014564402401447, + "mean_norm/layer0": 8.691066265106201, + "mean_norm/layer1": 8.756228804588318, + "mean_norm/layer10": 8.993315815925598, + "mean_norm/layer11": 9.095087945461273, + "mean_norm/layer12": 9.223419189453125, + "mean_norm/layer13": 8.934724807739258, + "mean_norm/layer14": 9.097132921218872, + "mean_norm/layer15": 9.206078290939331, + "mean_norm/layer16": 8.96629410982132, + "mean_norm/layer17": 9.170451998710632, + "mean_norm/layer18": 8.991504669189453, + "mean_norm/layer19": 8.998610973358154, + "mean_norm/layer2": 8.347860455513, + "mean_norm/layer20": 9.078348338603973, + "mean_norm/layer21": 9.045956909656525, + "mean_norm/layer22": 9.390547633171082, + "mean_norm/layer23": 9.38027411699295, + "mean_norm/layer3": 9.179291546344757, + "mean_norm/layer4": 8.803498148918152, + "mean_norm/layer5": 9.625588476657867, + "mean_norm/layer6": 8.616418182849884, + "mean_norm/layer7": 8.816068053245544, + "mean_norm/layer8": 8.981455445289612, + "mean_norm/layer9": 8.960322558879852, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 2400 + }, + { + "epoch": 1.0, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.44255971574938247, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.885669231414795, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5534, + "eval_samples_per_second": 20.86, + "eval_steps_per_second": 0.692, + "step": 2400 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.02, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8357, + "max_norm": 15.723752975463867, + "max_norm/layer0": 13.947762489318848, + "max_norm/layer1": 14.477116584777832, + "max_norm/layer10": 15.02506160736084, + "max_norm/layer11": 14.6520414352417, + "max_norm/layer12": 14.819252014160156, + "max_norm/layer13": 13.743169784545898, + "max_norm/layer14": 14.834115982055664, + "max_norm/layer15": 15.359285354614258, + "max_norm/layer16": 13.801314353942871, + "max_norm/layer17": 15.277505874633789, + "max_norm/layer18": 14.275938034057617, + "max_norm/layer19": 14.013418197631836, + "max_norm/layer2": 12.606481552124023, + "max_norm/layer20": 14.789701461791992, + "max_norm/layer21": 14.507436752319336, + "max_norm/layer22": 14.583073616027832, + "max_norm/layer23": 14.75890827178955, + "max_norm/layer3": 14.087556838989258, + "max_norm/layer4": 14.228026390075684, + "max_norm/layer5": 15.723752975463867, + "max_norm/layer6": 13.925374984741211, + "max_norm/layer7": 14.710521697998047, + "max_norm/layer8": 14.911945343017578, + "max_norm/layer9": 14.783496856689453, + "mean_norm": 9.031480019291243, + "mean_norm/layer0": 8.701723158359528, + "mean_norm/layer1": 8.768332779407501, + "mean_norm/layer10": 9.00841349363327, + "mean_norm/layer11": 9.112366914749146, + "mean_norm/layer12": 9.244458794593811, + "mean_norm/layer13": 8.950533390045166, + "mean_norm/layer14": 9.115843534469604, + "mean_norm/layer15": 9.226688921451569, + "mean_norm/layer16": 8.983336091041565, + "mean_norm/layer17": 9.191466331481934, + "mean_norm/layer18": 9.01020735502243, + "mean_norm/layer19": 9.017823576927185, + "mean_norm/layer2": 8.352315068244934, + "mean_norm/layer20": 9.098797261714935, + "mean_norm/layer21": 9.06588214635849, + "mean_norm/layer22": 9.41590791940689, + "mean_norm/layer23": 9.405222654342651, + "mean_norm/layer3": 9.196974635124207, + "mean_norm/layer4": 8.814748108386993, + "mean_norm/layer5": 9.65069442987442, + "mean_norm/layer6": 8.625239789485931, + "mean_norm/layer7": 8.827593207359314, + "mean_norm/layer8": 8.996190905570984, + "mean_norm/layer9": 8.974759995937347, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 2450 + }, + { + "epoch": 1.02, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.44219061177968955, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.891197443008423, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7944, + "eval_samples_per_second": 20.433, + "eval_steps_per_second": 0.678, + "step": 2450 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.04, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8427, + "max_norm": 15.870335578918457, + "max_norm/layer0": 14.013547897338867, + "max_norm/layer1": 14.573381423950195, + "max_norm/layer10": 15.130743026733398, + "max_norm/layer11": 14.750649452209473, + "max_norm/layer12": 14.940457344055176, + "max_norm/layer13": 13.85982894897461, + "max_norm/layer14": 14.928179740905762, + "max_norm/layer15": 15.517732620239258, + "max_norm/layer16": 13.898526191711426, + "max_norm/layer17": 15.39119815826416, + "max_norm/layer18": 14.368980407714844, + "max_norm/layer19": 14.072687149047852, + "max_norm/layer2": 12.69582748413086, + "max_norm/layer20": 14.895695686340332, + "max_norm/layer21": 14.618597030639648, + "max_norm/layer22": 14.678531646728516, + "max_norm/layer23": 14.874917030334473, + "max_norm/layer3": 14.15068244934082, + "max_norm/layer4": 14.324492454528809, + "max_norm/layer5": 15.870335578918457, + "max_norm/layer6": 13.982853889465332, + "max_norm/layer7": 14.777878761291504, + "max_norm/layer8": 15.033072471618652, + "max_norm/layer9": 14.886922836303711, + "mean_norm": 9.048154046138128, + "mean_norm/layer0": 8.712783455848694, + "mean_norm/layer1": 8.780392825603485, + "mean_norm/layer10": 9.02328896522522, + "mean_norm/layer11": 9.129519879817963, + "mean_norm/layer12": 9.265049755573273, + "mean_norm/layer13": 8.966003775596619, + "mean_norm/layer14": 9.13392037153244, + "mean_norm/layer15": 9.246784627437592, + "mean_norm/layer16": 8.9999498128891, + "mean_norm/layer17": 9.212452232837677, + "mean_norm/layer18": 9.028715074062347, + "mean_norm/layer19": 9.0364351272583, + "mean_norm/layer2": 8.356776595115662, + "mean_norm/layer20": 9.11862301826477, + "mean_norm/layer21": 9.0850949883461, + "mean_norm/layer22": 9.4408740401268, + "mean_norm/layer23": 9.429868519306183, + "mean_norm/layer3": 9.214716017246246, + "mean_norm/layer4": 8.826160609722137, + "mean_norm/layer5": 9.675524532794952, + "mean_norm/layer6": 8.633809804916382, + "mean_norm/layer7": 8.83916038274765, + "mean_norm/layer8": 9.010636866092682, + "mean_norm/layer9": 8.98915582895279, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 2500 + }, + { + "epoch": 1.04, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4415984229931493, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.8902156352996826, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8087, + "eval_samples_per_second": 20.409, + "eval_steps_per_second": 0.677, + "step": 2500 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.06, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8524, + "max_norm": 16.009868621826172, + "max_norm/layer0": 14.078265190124512, + "max_norm/layer1": 14.670526504516602, + "max_norm/layer10": 15.227030754089355, + "max_norm/layer11": 14.859092712402344, + "max_norm/layer12": 15.091114044189453, + "max_norm/layer13": 13.921088218688965, + "max_norm/layer14": 15.035015106201172, + "max_norm/layer15": 15.675447463989258, + "max_norm/layer16": 14.004446983337402, + "max_norm/layer17": 15.502359390258789, + "max_norm/layer18": 14.5051851272583, + "max_norm/layer19": 14.167274475097656, + "max_norm/layer2": 12.767056465148926, + "max_norm/layer20": 15.009303092956543, + "max_norm/layer21": 14.740386009216309, + "max_norm/layer22": 14.763566970825195, + "max_norm/layer23": 14.968628883361816, + "max_norm/layer3": 14.237839698791504, + "max_norm/layer4": 14.436867713928223, + "max_norm/layer5": 16.009868621826172, + "max_norm/layer6": 14.039834022521973, + "max_norm/layer7": 14.868507385253906, + "max_norm/layer8": 15.15004825592041, + "max_norm/layer9": 14.995036125183105, + "mean_norm": 9.064850961168608, + "mean_norm/layer0": 8.724150776863098, + "mean_norm/layer1": 8.792477667331696, + "mean_norm/layer10": 9.038262903690338, + "mean_norm/layer11": 9.146433353424072, + "mean_norm/layer12": 9.2858447432518, + "mean_norm/layer13": 8.981484949588776, + "mean_norm/layer14": 9.152089536190033, + "mean_norm/layer15": 9.266744434833527, + "mean_norm/layer16": 9.016795575618744, + "mean_norm/layer17": 9.233408987522125, + "mean_norm/layer18": 9.046853363513947, + "mean_norm/layer19": 9.05537211894989, + "mean_norm/layer2": 8.361333727836609, + "mean_norm/layer20": 9.13805490732193, + "mean_norm/layer21": 9.10432755947113, + "mean_norm/layer22": 9.466131627559662, + "mean_norm/layer23": 9.454012274742126, + "mean_norm/layer3": 9.232695639133453, + "mean_norm/layer4": 8.837390780448914, + "mean_norm/layer5": 9.700556099414825, + "mean_norm/layer6": 8.642646074295044, + "mean_norm/layer7": 8.850711584091187, + "mean_norm/layer8": 9.025233507156372, + "mean_norm/layer9": 9.003410875797272, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 2550 + }, + { + "epoch": 1.06, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4432127458496084, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.883772850036621, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.774, + "eval_samples_per_second": 20.469, + "eval_steps_per_second": 0.679, + "step": 2550 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.09, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8441, + "max_norm": 16.144901275634766, + "max_norm/layer0": 14.166998863220215, + "max_norm/layer1": 14.77054500579834, + "max_norm/layer10": 15.321858406066895, + "max_norm/layer11": 14.944963455200195, + "max_norm/layer12": 15.217597007751465, + "max_norm/layer13": 13.982170104980469, + "max_norm/layer14": 15.154606819152832, + "max_norm/layer15": 15.824800491333008, + "max_norm/layer16": 14.139287948608398, + "max_norm/layer17": 15.600570678710938, + "max_norm/layer18": 14.64634895324707, + "max_norm/layer19": 14.26150894165039, + "max_norm/layer2": 12.838845252990723, + "max_norm/layer20": 15.12016487121582, + "max_norm/layer21": 14.849102973937988, + "max_norm/layer22": 14.883748054504395, + "max_norm/layer23": 15.04641342163086, + "max_norm/layer3": 14.34477710723877, + "max_norm/layer4": 14.549644470214844, + "max_norm/layer5": 16.144901275634766, + "max_norm/layer6": 14.10580062866211, + "max_norm/layer7": 14.937480926513672, + "max_norm/layer8": 15.275439262390137, + "max_norm/layer9": 15.114044189453125, + "mean_norm": 9.081460249920687, + "mean_norm/layer0": 8.735827803611755, + "mean_norm/layer1": 8.804422497749329, + "mean_norm/layer10": 9.052965462207794, + "mean_norm/layer11": 9.16351443529129, + "mean_norm/layer12": 9.306387066841125, + "mean_norm/layer13": 8.996783316135406, + "mean_norm/layer14": 9.170424222946167, + "mean_norm/layer15": 9.286848545074463, + "mean_norm/layer16": 9.033456265926361, + "mean_norm/layer17": 9.253972351551056, + "mean_norm/layer18": 9.065014839172363, + "mean_norm/layer19": 9.074174404144287, + "mean_norm/layer2": 8.366111278533936, + "mean_norm/layer20": 9.157218277454376, + "mean_norm/layer21": 9.12339198589325, + "mean_norm/layer22": 9.491381049156189, + "mean_norm/layer23": 9.47799527645111, + "mean_norm/layer3": 9.250598967075348, + "mean_norm/layer4": 8.848586916923523, + "mean_norm/layer5": 9.725355744361877, + "mean_norm/layer6": 8.651413083076477, + "mean_norm/layer7": 8.862074136734009, + "mean_norm/layer8": 9.039798736572266, + "mean_norm/layer9": 9.017329335212708, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 2600 + }, + { + "epoch": 1.09, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4437805981106744, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.8798539638519287, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7931, + "eval_samples_per_second": 20.436, + "eval_steps_per_second": 0.678, + "step": 2600 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.11, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8597, + "max_norm": 16.280908584594727, + "max_norm/layer0": 14.25904369354248, + "max_norm/layer1": 14.876733779907227, + "max_norm/layer10": 15.432615280151367, + "max_norm/layer11": 15.070473670959473, + "max_norm/layer12": 15.340192794799805, + "max_norm/layer13": 14.053213119506836, + "max_norm/layer14": 15.254984855651855, + "max_norm/layer15": 15.967584609985352, + "max_norm/layer16": 14.240683555603027, + "max_norm/layer17": 15.71219253540039, + "max_norm/layer18": 14.776082992553711, + "max_norm/layer19": 14.346572875976562, + "max_norm/layer2": 12.922161102294922, + "max_norm/layer20": 15.224787712097168, + "max_norm/layer21": 14.95941162109375, + "max_norm/layer22": 15.001152038574219, + "max_norm/layer23": 15.122055053710938, + "max_norm/layer3": 14.454421997070312, + "max_norm/layer4": 14.653867721557617, + "max_norm/layer5": 16.280908584594727, + "max_norm/layer6": 14.169611930847168, + "max_norm/layer7": 15.036980628967285, + "max_norm/layer8": 15.427152633666992, + "max_norm/layer9": 15.218523025512695, + "mean_norm": 9.097782894968987, + "mean_norm/layer0": 8.747545421123505, + "mean_norm/layer1": 8.816453874111176, + "mean_norm/layer10": 9.067423224449158, + "mean_norm/layer11": 9.180491149425507, + "mean_norm/layer12": 9.326535284519196, + "mean_norm/layer13": 9.011679291725159, + "mean_norm/layer14": 9.18821370601654, + "mean_norm/layer15": 9.306611061096191, + "mean_norm/layer16": 9.050126194953918, + "mean_norm/layer17": 9.274332463741302, + "mean_norm/layer18": 9.083183467388153, + "mean_norm/layer19": 9.092769265174866, + "mean_norm/layer2": 8.370811522006989, + "mean_norm/layer20": 9.176023662090302, + "mean_norm/layer21": 9.141830861568451, + "mean_norm/layer22": 9.516046524047852, + "mean_norm/layer23": 9.501545190811157, + "mean_norm/layer3": 9.268109500408173, + "mean_norm/layer4": 8.859676361083984, + "mean_norm/layer5": 9.749540209770203, + "mean_norm/layer6": 8.65969580411911, + "mean_norm/layer7": 8.873176157474518, + "mean_norm/layer8": 9.053912878036499, + "mean_norm/layer9": 9.03105640411377, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 2650 + }, + { + "epoch": 1.11, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4426530057637004, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.882810115814209, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7841, + "eval_samples_per_second": 20.451, + "eval_steps_per_second": 0.679, + "step": 2650 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.13, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8523, + "max_norm": 16.419876098632812, + "max_norm/layer0": 14.34637451171875, + "max_norm/layer1": 14.984748840332031, + "max_norm/layer10": 15.536199569702148, + "max_norm/layer11": 15.177663803100586, + "max_norm/layer12": 15.445916175842285, + "max_norm/layer13": 14.101208686828613, + "max_norm/layer14": 15.343002319335938, + "max_norm/layer15": 16.075366973876953, + "max_norm/layer16": 14.350403785705566, + "max_norm/layer17": 15.8396577835083, + "max_norm/layer18": 14.874992370605469, + "max_norm/layer19": 14.431367874145508, + "max_norm/layer2": 13.012994766235352, + "max_norm/layer20": 15.345575332641602, + "max_norm/layer21": 15.066669464111328, + "max_norm/layer22": 15.1093111038208, + "max_norm/layer23": 15.202255249023438, + "max_norm/layer3": 14.54269790649414, + "max_norm/layer4": 14.769430160522461, + "max_norm/layer5": 16.419876098632812, + "max_norm/layer6": 14.223309516906738, + "max_norm/layer7": 15.136229515075684, + "max_norm/layer8": 15.555449485778809, + "max_norm/layer9": 15.360017776489258, + "mean_norm": 9.113588072359562, + "mean_norm/layer0": 8.759117603302002, + "mean_norm/layer1": 8.828328490257263, + "mean_norm/layer10": 9.081544935703278, + "mean_norm/layer11": 9.196539223194122, + "mean_norm/layer12": 9.34596437215805, + "mean_norm/layer13": 9.026325702667236, + "mean_norm/layer14": 9.20580768585205, + "mean_norm/layer15": 9.325709998607635, + "mean_norm/layer16": 9.066176950931549, + "mean_norm/layer17": 9.293815612792969, + "mean_norm/layer18": 9.100383222103119, + "mean_norm/layer19": 9.110606670379639, + "mean_norm/layer2": 8.375436842441559, + "mean_norm/layer20": 9.194181025028229, + "mean_norm/layer21": 9.159276247024536, + "mean_norm/layer22": 9.539666295051575, + "mean_norm/layer23": 9.524423122406006, + "mean_norm/layer3": 9.285327970981598, + "mean_norm/layer4": 8.870383977890015, + "mean_norm/layer5": 9.77319449186325, + "mean_norm/layer6": 8.667758345603943, + "mean_norm/layer7": 8.884088516235352, + "mean_norm/layer8": 9.067574143409729, + "mean_norm/layer9": 9.044482290744781, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 2700 + }, + { + "epoch": 1.13, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.443082951047079, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.877031087875366, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8014, + "eval_samples_per_second": 20.421, + "eval_steps_per_second": 0.678, + "step": 2700 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.15, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8622, + "max_norm": 16.557350158691406, + "max_norm/layer0": 14.418149948120117, + "max_norm/layer1": 15.097500801086426, + "max_norm/layer10": 15.643484115600586, + "max_norm/layer11": 15.281368255615234, + "max_norm/layer12": 15.568787574768066, + "max_norm/layer13": 14.152594566345215, + "max_norm/layer14": 15.426847457885742, + "max_norm/layer15": 16.16790199279785, + "max_norm/layer16": 14.4529447555542, + "max_norm/layer17": 15.965700149536133, + "max_norm/layer18": 15.009598731994629, + "max_norm/layer19": 14.541038513183594, + "max_norm/layer2": 13.10386848449707, + "max_norm/layer20": 15.445903778076172, + "max_norm/layer21": 15.171789169311523, + "max_norm/layer22": 15.222389221191406, + "max_norm/layer23": 15.312973976135254, + "max_norm/layer3": 14.611842155456543, + "max_norm/layer4": 14.887364387512207, + "max_norm/layer5": 16.557350158691406, + "max_norm/layer6": 14.284734725952148, + "max_norm/layer7": 15.256564140319824, + "max_norm/layer8": 15.690933227539062, + "max_norm/layer9": 15.485148429870605, + "mean_norm": 9.129469233254591, + "mean_norm/layer0": 8.77081549167633, + "mean_norm/layer1": 8.84003496170044, + "mean_norm/layer10": 9.095685243606567, + "mean_norm/layer11": 9.2125763297081, + "mean_norm/layer12": 9.365703403949738, + "mean_norm/layer13": 9.041068434715271, + "mean_norm/layer14": 9.223137736320496, + "mean_norm/layer15": 9.344794929027557, + "mean_norm/layer16": 9.082189679145813, + "mean_norm/layer17": 9.313395082950592, + "mean_norm/layer18": 9.11777526140213, + "mean_norm/layer19": 9.128398835659027, + "mean_norm/layer2": 8.379985272884369, + "mean_norm/layer20": 9.213001072406769, + "mean_norm/layer21": 9.177213549613953, + "mean_norm/layer22": 9.56313019990921, + "mean_norm/layer23": 9.547671377658844, + "mean_norm/layer3": 9.302635192871094, + "mean_norm/layer4": 8.881201982498169, + "mean_norm/layer5": 9.797004163265228, + "mean_norm/layer6": 8.67586863040924, + "mean_norm/layer7": 8.894869089126587, + "mean_norm/layer8": 9.081298410892487, + "mean_norm/layer9": 9.057807266712189, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 2750 + }, + { + "epoch": 1.15, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4445593669258507, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.8714001178741455, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7901, + "eval_samples_per_second": 20.441, + "eval_steps_per_second": 0.679, + "step": 2750 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.17, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.864, + "max_norm": 16.692607879638672, + "max_norm/layer0": 14.486806869506836, + "max_norm/layer1": 15.20768928527832, + "max_norm/layer10": 15.750007629394531, + "max_norm/layer11": 15.358442306518555, + "max_norm/layer12": 15.6708984375, + "max_norm/layer13": 14.241842269897461, + "max_norm/layer14": 15.518338203430176, + "max_norm/layer15": 16.292762756347656, + "max_norm/layer16": 14.54626750946045, + "max_norm/layer17": 16.069358825683594, + "max_norm/layer18": 15.13725757598877, + "max_norm/layer19": 14.667492866516113, + "max_norm/layer2": 13.187070846557617, + "max_norm/layer20": 15.576197624206543, + "max_norm/layer21": 15.274862289428711, + "max_norm/layer22": 15.325810432434082, + "max_norm/layer23": 15.413392066955566, + "max_norm/layer3": 14.685466766357422, + "max_norm/layer4": 14.984869003295898, + "max_norm/layer5": 16.692607879638672, + "max_norm/layer6": 14.32935619354248, + "max_norm/layer7": 15.362448692321777, + "max_norm/layer8": 15.82071304321289, + "max_norm/layer9": 15.565882682800293, + "mean_norm": 9.145023641486963, + "mean_norm/layer0": 8.78237795829773, + "mean_norm/layer1": 8.851688504219055, + "mean_norm/layer10": 9.109631359577179, + "mean_norm/layer11": 9.228287041187286, + "mean_norm/layer12": 9.385038435459137, + "mean_norm/layer13": 9.055398046970367, + "mean_norm/layer14": 9.239995121955872, + "mean_norm/layer15": 9.363190233707428, + "mean_norm/layer16": 9.097616195678711, + "mean_norm/layer17": 9.332431018352509, + "mean_norm/layer18": 9.135051906108856, + "mean_norm/layer19": 9.145816683769226, + "mean_norm/layer2": 8.38431704044342, + "mean_norm/layer20": 9.23117482662201, + "mean_norm/layer21": 9.19452828168869, + "mean_norm/layer22": 9.586361765861511, + "mean_norm/layer23": 9.570209264755249, + "mean_norm/layer3": 9.319473028182983, + "mean_norm/layer4": 8.891644835472107, + "mean_norm/layer5": 9.820540606975555, + "mean_norm/layer6": 8.68411499261856, + "mean_norm/layer7": 8.905657947063446, + "mean_norm/layer8": 9.094788134098053, + "mean_norm/layer9": 9.071234166622162, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 2800 + }, + { + "epoch": 1.17, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4445796473637459, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.873532295227051, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8068, + "eval_samples_per_second": 20.412, + "eval_steps_per_second": 0.678, + "step": 2800 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.19, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8527, + "max_norm": 16.828922271728516, + "max_norm/layer0": 14.584033012390137, + "max_norm/layer1": 15.336833000183105, + "max_norm/layer10": 15.875840187072754, + "max_norm/layer11": 15.442821502685547, + "max_norm/layer12": 15.754557609558105, + "max_norm/layer13": 14.32339096069336, + "max_norm/layer14": 15.597060203552246, + "max_norm/layer15": 16.412872314453125, + "max_norm/layer16": 14.650659561157227, + "max_norm/layer17": 16.20420265197754, + "max_norm/layer18": 15.219154357910156, + "max_norm/layer19": 14.83084774017334, + "max_norm/layer2": 13.268367767333984, + "max_norm/layer20": 15.677299499511719, + "max_norm/layer21": 15.406458854675293, + "max_norm/layer22": 15.44321060180664, + "max_norm/layer23": 15.511178016662598, + "max_norm/layer3": 14.764835357666016, + "max_norm/layer4": 15.09919548034668, + "max_norm/layer5": 16.828922271728516, + "max_norm/layer6": 14.383938789367676, + "max_norm/layer7": 15.485296249389648, + "max_norm/layer8": 15.941476821899414, + "max_norm/layer9": 15.665557861328125, + "mean_norm": 9.160597927868366, + "mean_norm/layer0": 8.794089376926422, + "mean_norm/layer1": 8.863369762897491, + "mean_norm/layer10": 9.12364000082016, + "mean_norm/layer11": 9.244284212589264, + "mean_norm/layer12": 9.404542028903961, + "mean_norm/layer13": 9.069941818714142, + "mean_norm/layer14": 9.256960809230804, + "mean_norm/layer15": 9.381789445877075, + "mean_norm/layer16": 9.113153159618378, + "mean_norm/layer17": 9.35132884979248, + "mean_norm/layer18": 9.151803016662598, + "mean_norm/layer19": 9.163000464439392, + "mean_norm/layer2": 8.388769388198853, + "mean_norm/layer20": 9.248739957809448, + "mean_norm/layer21": 9.21191132068634, + "mean_norm/layer22": 9.609494626522064, + "mean_norm/layer23": 9.593034207820892, + "mean_norm/layer3": 9.33625191450119, + "mean_norm/layer4": 8.902081072330475, + "mean_norm/layer5": 9.844298720359802, + "mean_norm/layer6": 8.692344605922699, + "mean_norm/layer7": 8.916409969329834, + "mean_norm/layer8": 9.108461380004883, + "mean_norm/layer9": 9.084650158882141, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 2850 + }, + { + "epoch": 1.19, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.44370758853425163, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.8756139278411865, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8326, + "eval_samples_per_second": 20.368, + "eval_steps_per_second": 0.676, + "step": 2850 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.21, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8409, + "max_norm": 16.954225540161133, + "max_norm/layer0": 14.67629623413086, + "max_norm/layer1": 15.439681053161621, + "max_norm/layer10": 15.993009567260742, + "max_norm/layer11": 15.52728271484375, + "max_norm/layer12": 15.852997779846191, + "max_norm/layer13": 14.400331497192383, + "max_norm/layer14": 15.702228546142578, + "max_norm/layer15": 16.554004669189453, + "max_norm/layer16": 14.767534255981445, + "max_norm/layer17": 16.32081413269043, + "max_norm/layer18": 15.322539329528809, + "max_norm/layer19": 14.932204246520996, + "max_norm/layer2": 13.33304214477539, + "max_norm/layer20": 15.784565925598145, + "max_norm/layer21": 15.512778282165527, + "max_norm/layer22": 15.573765754699707, + "max_norm/layer23": 15.618204116821289, + "max_norm/layer3": 14.863533973693848, + "max_norm/layer4": 15.184027671813965, + "max_norm/layer5": 16.954225540161133, + "max_norm/layer6": 14.433019638061523, + "max_norm/layer7": 15.593091011047363, + "max_norm/layer8": 16.040678024291992, + "max_norm/layer9": 15.799813270568848, + "mean_norm": 9.175687476992607, + "mean_norm/layer0": 8.805468738079071, + "mean_norm/layer1": 8.874761521816254, + "mean_norm/layer10": 9.137395858764648, + "mean_norm/layer11": 9.259815275669098, + "mean_norm/layer12": 9.423438429832458, + "mean_norm/layer13": 9.08407998085022, + "mean_norm/layer14": 9.273297250270844, + "mean_norm/layer15": 9.399744391441345, + "mean_norm/layer16": 9.12816721200943, + "mean_norm/layer17": 9.369861721992493, + "mean_norm/layer18": 9.168180584907532, + "mean_norm/layer19": 9.179289519786835, + "mean_norm/layer2": 8.39303857088089, + "mean_norm/layer20": 9.265758633613586, + "mean_norm/layer21": 9.228505730628967, + "mean_norm/layer22": 9.631839513778687, + "mean_norm/layer23": 9.615257382392883, + "mean_norm/layer3": 9.35254430770874, + "mean_norm/layer4": 8.912357032299042, + "mean_norm/layer5": 9.867339313030243, + "mean_norm/layer6": 8.700405836105347, + "mean_norm/layer7": 8.926807165145874, + "mean_norm/layer8": 9.121643006801605, + "mean_norm/layer9": 9.09750247001648, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 2900 + }, + { + "epoch": 1.21, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.44484329305638365, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.8662402629852295, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5382, + "eval_samples_per_second": 20.887, + "eval_steps_per_second": 0.693, + "step": 2900 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.23, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8535, + "max_norm": 17.074094772338867, + "max_norm/layer0": 14.771538734436035, + "max_norm/layer1": 15.542774200439453, + "max_norm/layer10": 16.1263370513916, + "max_norm/layer11": 15.602151870727539, + "max_norm/layer12": 15.966864585876465, + "max_norm/layer13": 14.503449440002441, + "max_norm/layer14": 15.782112121582031, + "max_norm/layer15": 16.67736053466797, + "max_norm/layer16": 14.884428977966309, + "max_norm/layer17": 16.445512771606445, + "max_norm/layer18": 15.415112495422363, + "max_norm/layer19": 15.022063255310059, + "max_norm/layer2": 13.403141021728516, + "max_norm/layer20": 15.920245170593262, + "max_norm/layer21": 15.62589168548584, + "max_norm/layer22": 15.720357894897461, + "max_norm/layer23": 15.716158866882324, + "max_norm/layer3": 14.941350936889648, + "max_norm/layer4": 15.257119178771973, + "max_norm/layer5": 17.074094772338867, + "max_norm/layer6": 14.491571426391602, + "max_norm/layer7": 15.718575477600098, + "max_norm/layer8": 16.172351837158203, + "max_norm/layer9": 15.940131187438965, + "mean_norm": 9.190696770946184, + "mean_norm/layer0": 8.816956281661987, + "mean_norm/layer1": 8.88613373041153, + "mean_norm/layer10": 9.150634229183197, + "mean_norm/layer11": 9.275252103805542, + "mean_norm/layer12": 9.442244589328766, + "mean_norm/layer13": 9.098045706748962, + "mean_norm/layer14": 9.289654433727264, + "mean_norm/layer15": 9.417704820632935, + "mean_norm/layer16": 9.143186032772064, + "mean_norm/layer17": 9.388283371925354, + "mean_norm/layer18": 9.184568285942078, + "mean_norm/layer19": 9.19563889503479, + "mean_norm/layer2": 8.397359848022461, + "mean_norm/layer20": 9.282590985298157, + "mean_norm/layer21": 9.245154798030853, + "mean_norm/layer22": 9.65415096282959, + "mean_norm/layer23": 9.63697373867035, + "mean_norm/layer3": 9.368990659713745, + "mean_norm/layer4": 8.922351777553558, + "mean_norm/layer5": 9.89015644788742, + "mean_norm/layer6": 8.708074033260345, + "mean_norm/layer7": 8.937257945537567, + "mean_norm/layer8": 9.134815633296967, + "mean_norm/layer9": 9.110543191432953, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 2950 + }, + { + "epoch": 1.23, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4459871097536738, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.8599984645843506, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7959, + "eval_samples_per_second": 20.431, + "eval_steps_per_second": 0.678, + "step": 2950 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.25, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8447, + "max_norm": 17.19088363647461, + "max_norm/layer0": 14.864973068237305, + "max_norm/layer1": 15.62208080291748, + "max_norm/layer10": 16.26564598083496, + "max_norm/layer11": 15.690491676330566, + "max_norm/layer12": 16.09348487854004, + "max_norm/layer13": 14.608466148376465, + "max_norm/layer14": 15.872156143188477, + "max_norm/layer15": 16.789859771728516, + "max_norm/layer16": 14.985624313354492, + "max_norm/layer17": 16.59108543395996, + "max_norm/layer18": 15.49613094329834, + "max_norm/layer19": 15.138503074645996, + "max_norm/layer2": 13.480121612548828, + "max_norm/layer20": 16.039661407470703, + "max_norm/layer21": 15.726054191589355, + "max_norm/layer22": 15.85644245147705, + "max_norm/layer23": 15.822321891784668, + "max_norm/layer3": 15.016472816467285, + "max_norm/layer4": 15.327754020690918, + "max_norm/layer5": 17.19088363647461, + "max_norm/layer6": 14.556528091430664, + "max_norm/layer7": 15.827574729919434, + "max_norm/layer8": 16.28036880493164, + "max_norm/layer9": 16.034198760986328, + "mean_norm": 9.205305655797323, + "mean_norm/layer0": 8.828269600868225, + "mean_norm/layer1": 8.897296965122223, + "mean_norm/layer10": 9.163637578487396, + "mean_norm/layer11": 9.2901731133461, + "mean_norm/layer12": 9.460385203361511, + "mean_norm/layer13": 9.11164516210556, + "mean_norm/layer14": 9.305707812309265, + "mean_norm/layer15": 9.43520051240921, + "mean_norm/layer16": 9.157863140106201, + "mean_norm/layer17": 9.406088531017303, + "mean_norm/layer18": 9.200478971004486, + "mean_norm/layer19": 9.211331129074097, + "mean_norm/layer2": 8.401508867740631, + "mean_norm/layer20": 9.298927962779999, + "mean_norm/layer21": 9.261110067367554, + "mean_norm/layer22": 9.6760755777359, + "mean_norm/layer23": 9.658278584480286, + "mean_norm/layer3": 9.3849378824234, + "mean_norm/layer4": 8.932135999202728, + "mean_norm/layer5": 9.912546157836914, + "mean_norm/layer6": 8.71561086177826, + "mean_norm/layer7": 8.947454273700714, + "mean_norm/layer8": 9.147588908672333, + "mean_norm/layer9": 9.123082876205444, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 3000 + }, + { + "epoch": 1.25, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4469808512105393, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.8544092178344727, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8166, + "eval_samples_per_second": 20.395, + "eval_steps_per_second": 0.677, + "step": 3000 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.27, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8494, + "max_norm": 17.332006454467773, + "max_norm/layer0": 14.971895217895508, + "max_norm/layer1": 15.706180572509766, + "max_norm/layer10": 16.39055633544922, + "max_norm/layer11": 15.820825576782227, + "max_norm/layer12": 16.230440139770508, + "max_norm/layer13": 14.713774681091309, + "max_norm/layer14": 15.964306831359863, + "max_norm/layer15": 16.913372039794922, + "max_norm/layer16": 15.084409713745117, + "max_norm/layer17": 16.690601348876953, + "max_norm/layer18": 15.592001914978027, + "max_norm/layer19": 15.248854637145996, + "max_norm/layer2": 13.564947128295898, + "max_norm/layer20": 16.140636444091797, + "max_norm/layer21": 15.825383186340332, + "max_norm/layer22": 15.98045825958252, + "max_norm/layer23": 15.944609642028809, + "max_norm/layer3": 15.109355926513672, + "max_norm/layer4": 15.39990234375, + "max_norm/layer5": 17.332006454467773, + "max_norm/layer6": 14.59697437286377, + "max_norm/layer7": 15.948881149291992, + "max_norm/layer8": 16.376832962036133, + "max_norm/layer9": 16.13812828063965, + "mean_norm": 9.220104138056437, + "mean_norm/layer0": 8.839670896530151, + "mean_norm/layer1": 8.908665537834167, + "mean_norm/layer10": 9.176793336868286, + "mean_norm/layer11": 9.305428922176361, + "mean_norm/layer12": 9.478922605514526, + "mean_norm/layer13": 9.125423610210419, + "mean_norm/layer14": 9.321944952011108, + "mean_norm/layer15": 9.452899932861328, + "mean_norm/layer16": 9.172569692134857, + "mean_norm/layer17": 9.424022793769836, + "mean_norm/layer18": 9.216603875160217, + "mean_norm/layer19": 9.227488934993744, + "mean_norm/layer2": 8.40572214126587, + "mean_norm/layer20": 9.315212488174438, + "mean_norm/layer21": 9.277587234973907, + "mean_norm/layer22": 9.698153376579285, + "mean_norm/layer23": 9.679868876934052, + "mean_norm/layer3": 9.401076316833496, + "mean_norm/layer4": 8.941973567008972, + "mean_norm/layer5": 9.935079276561737, + "mean_norm/layer6": 8.72326409816742, + "mean_norm/layer7": 8.957727432250977, + "mean_norm/layer8": 9.160670280456543, + "mean_norm/layer9": 9.135729134082794, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 3050 + }, + { + "epoch": 1.27, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.44626292370904874, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.8586294651031494, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8056, + "eval_samples_per_second": 20.414, + "eval_steps_per_second": 0.678, + "step": 3050 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.29, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.851, + "max_norm": 17.45079231262207, + "max_norm/layer0": 15.07141399383545, + "max_norm/layer1": 15.788281440734863, + "max_norm/layer10": 16.522247314453125, + "max_norm/layer11": 15.996971130371094, + "max_norm/layer12": 16.32065200805664, + "max_norm/layer13": 14.813121795654297, + "max_norm/layer14": 16.042503356933594, + "max_norm/layer15": 17.024852752685547, + "max_norm/layer16": 15.163915634155273, + "max_norm/layer17": 16.79519271850586, + "max_norm/layer18": 15.687070846557617, + "max_norm/layer19": 15.342894554138184, + "max_norm/layer2": 13.622076034545898, + "max_norm/layer20": 16.25835418701172, + "max_norm/layer21": 15.937350273132324, + "max_norm/layer22": 16.101654052734375, + "max_norm/layer23": 16.047069549560547, + "max_norm/layer3": 15.202547073364258, + "max_norm/layer4": 15.467806816101074, + "max_norm/layer5": 17.45079231262207, + "max_norm/layer6": 14.651065826416016, + "max_norm/layer7": 16.03363609313965, + "max_norm/layer8": 16.475841522216797, + "max_norm/layer9": 16.232484817504883, + "mean_norm": 9.234526852766672, + "mean_norm/layer0": 8.850844144821167, + "mean_norm/layer1": 8.919748723506927, + "mean_norm/layer10": 9.189667701721191, + "mean_norm/layer11": 9.320032119750977, + "mean_norm/layer12": 9.49708503484726, + "mean_norm/layer13": 9.138881921768188, + "mean_norm/layer14": 9.337770938873291, + "mean_norm/layer15": 9.47018826007843, + "mean_norm/layer16": 9.186775863170624, + "mean_norm/layer17": 9.441416263580322, + "mean_norm/layer18": 9.232204139232635, + "mean_norm/layer19": 9.243465781211853, + "mean_norm/layer2": 8.40979117155075, + "mean_norm/layer20": 9.331261694431305, + "mean_norm/layer21": 9.293141663074493, + "mean_norm/layer22": 9.719446420669556, + "mean_norm/layer23": 9.700763463973999, + "mean_norm/layer3": 9.41711300611496, + "mean_norm/layer4": 8.95202124118805, + "mean_norm/layer5": 9.957186877727509, + "mean_norm/layer6": 8.730644345283508, + "mean_norm/layer7": 8.96764749288559, + "mean_norm/layer8": 9.17331349849701, + "mean_norm/layer9": 9.148232698440552, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 3100 + }, + { + "epoch": 1.29, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.44737429170570653, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.8489952087402344, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5802, + "eval_samples_per_second": 20.811, + "eval_steps_per_second": 0.691, + "step": 3100 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.32, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8352, + "max_norm": 17.570619583129883, + "max_norm/layer0": 15.160906791687012, + "max_norm/layer1": 15.87808609008789, + "max_norm/layer10": 16.663211822509766, + "max_norm/layer11": 16.07549285888672, + "max_norm/layer12": 16.4635066986084, + "max_norm/layer13": 14.898290634155273, + "max_norm/layer14": 16.140918731689453, + "max_norm/layer15": 17.153202056884766, + "max_norm/layer16": 15.241742134094238, + "max_norm/layer17": 16.903993606567383, + "max_norm/layer18": 15.782885551452637, + "max_norm/layer19": 15.452775001525879, + "max_norm/layer2": 13.689221382141113, + "max_norm/layer20": 16.361042022705078, + "max_norm/layer21": 16.02024269104004, + "max_norm/layer22": 16.25684928894043, + "max_norm/layer23": 16.14984703063965, + "max_norm/layer3": 15.28460693359375, + "max_norm/layer4": 15.529900550842285, + "max_norm/layer5": 17.570619583129883, + "max_norm/layer6": 14.70571231842041, + "max_norm/layer7": 16.162504196166992, + "max_norm/layer8": 16.585596084594727, + "max_norm/layer9": 16.349956512451172, + "mean_norm": 9.248786879082521, + "mean_norm/layer0": 8.861954629421234, + "mean_norm/layer1": 8.930564403533936, + "mean_norm/layer10": 9.202419340610504, + "mean_norm/layer11": 9.334671199321747, + "mean_norm/layer12": 9.51488173007965, + "mean_norm/layer13": 9.152113914489746, + "mean_norm/layer14": 9.353131890296936, + "mean_norm/layer15": 9.487328350543976, + "mean_norm/layer16": 9.201062262058258, + "mean_norm/layer17": 9.458812892436981, + "mean_norm/layer18": 9.247539579868317, + "mean_norm/layer19": 9.259144306182861, + "mean_norm/layer2": 8.413836479187012, + "mean_norm/layer20": 9.347349166870117, + "mean_norm/layer21": 9.308494091033936, + "mean_norm/layer22": 9.74064427614212, + "mean_norm/layer23": 9.721216857433319, + "mean_norm/layer3": 9.432927966117859, + "mean_norm/layer4": 8.961803197860718, + "mean_norm/layer5": 9.979026854038239, + "mean_norm/layer6": 8.738053262233734, + "mean_norm/layer7": 8.977501392364502, + "mean_norm/layer8": 9.185922145843506, + "mean_norm/layer9": 9.160484910011292, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 3150 + }, + { + "epoch": 1.32, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.44814089225814563, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.843223810195923, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8154, + "eval_samples_per_second": 20.397, + "eval_steps_per_second": 0.677, + "step": 3150 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.34, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8437, + "max_norm": 17.70356559753418, + "max_norm/layer0": 15.250068664550781, + "max_norm/layer1": 15.979663848876953, + "max_norm/layer10": 16.79854965209961, + "max_norm/layer11": 16.147912979125977, + "max_norm/layer12": 16.560741424560547, + "max_norm/layer13": 14.95504379272461, + "max_norm/layer14": 16.233966827392578, + "max_norm/layer15": 17.285449981689453, + "max_norm/layer16": 15.354681015014648, + "max_norm/layer17": 17.01114273071289, + "max_norm/layer18": 15.888689994812012, + "max_norm/layer19": 15.555651664733887, + "max_norm/layer2": 13.74233341217041, + "max_norm/layer20": 16.473976135253906, + "max_norm/layer21": 16.12687873840332, + "max_norm/layer22": 16.351245880126953, + "max_norm/layer23": 16.270776748657227, + "max_norm/layer3": 15.34660530090332, + "max_norm/layer4": 15.623671531677246, + "max_norm/layer5": 17.70356559753418, + "max_norm/layer6": 14.763014793395996, + "max_norm/layer7": 16.251935958862305, + "max_norm/layer8": 16.690643310546875, + "max_norm/layer9": 16.44407844543457, + "mean_norm": 9.263032605250677, + "mean_norm/layer0": 8.873132646083832, + "mean_norm/layer1": 8.94136381149292, + "mean_norm/layer10": 9.215128123760223, + "mean_norm/layer11": 9.349354445934296, + "mean_norm/layer12": 9.532716155052185, + "mean_norm/layer13": 9.165308952331543, + "mean_norm/layer14": 9.368605971336365, + "mean_norm/layer15": 9.50459748506546, + "mean_norm/layer16": 9.215272843837738, + "mean_norm/layer17": 9.476195633411407, + "mean_norm/layer18": 9.262809813022614, + "mean_norm/layer19": 9.27439969778061, + "mean_norm/layer2": 8.417843043804169, + "mean_norm/layer20": 9.363462388515472, + "mean_norm/layer21": 9.324271738529205, + "mean_norm/layer22": 9.761922836303711, + "mean_norm/layer23": 9.74175089597702, + "mean_norm/layer3": 9.448581278324127, + "mean_norm/layer4": 8.971577763557434, + "mean_norm/layer5": 10.000657439231873, + "mean_norm/layer6": 8.745424628257751, + "mean_norm/layer7": 8.987475097179413, + "mean_norm/layer8": 9.198350310325623, + "mean_norm/layer9": 9.172579526901245, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 3200 + }, + { + "epoch": 1.34, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.447702834799609, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.8433425426483154, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.819, + "eval_samples_per_second": 20.391, + "eval_steps_per_second": 0.677, + "step": 3200 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.36, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8519, + "max_norm": 17.860597610473633, + "max_norm/layer0": 15.346634864807129, + "max_norm/layer1": 16.065568923950195, + "max_norm/layer10": 16.915620803833008, + "max_norm/layer11": 16.206560134887695, + "max_norm/layer12": 16.65528106689453, + "max_norm/layer13": 15.02581787109375, + "max_norm/layer14": 16.34491539001465, + "max_norm/layer15": 17.41537094116211, + "max_norm/layer16": 15.447769165039062, + "max_norm/layer17": 17.1556339263916, + "max_norm/layer18": 15.984742164611816, + "max_norm/layer19": 15.66572380065918, + "max_norm/layer2": 13.785428047180176, + "max_norm/layer20": 16.59414291381836, + "max_norm/layer21": 16.224258422851562, + "max_norm/layer22": 16.447364807128906, + "max_norm/layer23": 16.371061325073242, + "max_norm/layer3": 15.438834190368652, + "max_norm/layer4": 15.713982582092285, + "max_norm/layer5": 17.860597610473633, + "max_norm/layer6": 14.833402633666992, + "max_norm/layer7": 16.37326431274414, + "max_norm/layer8": 16.806903839111328, + "max_norm/layer9": 16.539751052856445, + "mean_norm": 9.277176524202028, + "mean_norm/layer0": 8.884214758872986, + "mean_norm/layer1": 8.952378034591675, + "mean_norm/layer10": 9.227916955947876, + "mean_norm/layer11": 9.363875806331635, + "mean_norm/layer12": 9.550445020198822, + "mean_norm/layer13": 9.178218245506287, + "mean_norm/layer14": 9.384025871753693, + "mean_norm/layer15": 9.521648645401001, + "mean_norm/layer16": 9.22939395904541, + "mean_norm/layer17": 9.493267953395844, + "mean_norm/layer18": 9.277807056903839, + "mean_norm/layer19": 9.289763867855072, + "mean_norm/layer2": 8.421853244304657, + "mean_norm/layer20": 9.379169642925262, + "mean_norm/layer21": 9.339562237262726, + "mean_norm/layer22": 9.782929956912994, + "mean_norm/layer23": 9.762168943881989, + "mean_norm/layer3": 9.464285552501678, + "mean_norm/layer4": 8.981122076511383, + "mean_norm/layer5": 10.022289276123047, + "mean_norm/layer6": 8.752665579319, + "mean_norm/layer7": 8.997315227985382, + "mean_norm/layer8": 9.211067497730255, + "mean_norm/layer9": 9.184851169586182, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 3250 + }, + { + "epoch": 1.36, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.44898455847458657, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.8393099308013916, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8059, + "eval_samples_per_second": 20.413, + "eval_steps_per_second": 0.678, + "step": 3250 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.38, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8446, + "max_norm": 18.016963958740234, + "max_norm/layer0": 15.441362380981445, + "max_norm/layer1": 16.141338348388672, + "max_norm/layer10": 17.031034469604492, + "max_norm/layer11": 16.273303985595703, + "max_norm/layer12": 16.74533462524414, + "max_norm/layer13": 15.093159675598145, + "max_norm/layer14": 16.452301025390625, + "max_norm/layer15": 17.527395248413086, + "max_norm/layer16": 15.512605667114258, + "max_norm/layer17": 17.280061721801758, + "max_norm/layer18": 16.084121704101562, + "max_norm/layer19": 15.759353637695312, + "max_norm/layer2": 13.81966781616211, + "max_norm/layer20": 16.718875885009766, + "max_norm/layer21": 16.32035255432129, + "max_norm/layer22": 16.567575454711914, + "max_norm/layer23": 16.46967124938965, + "max_norm/layer3": 15.51447582244873, + "max_norm/layer4": 15.789702415466309, + "max_norm/layer5": 18.016963958740234, + "max_norm/layer6": 14.896657943725586, + "max_norm/layer7": 16.477813720703125, + "max_norm/layer8": 16.922813415527344, + "max_norm/layer9": 16.6334171295166, + "mean_norm": 9.290889439483484, + "mean_norm/layer0": 8.895033597946167, + "mean_norm/layer1": 8.963081002235413, + "mean_norm/layer10": 9.240162551403046, + "mean_norm/layer11": 9.377988994121552, + "mean_norm/layer12": 9.567772030830383, + "mean_norm/layer13": 9.190891683101654, + "mean_norm/layer14": 9.399105072021484, + "mean_norm/layer15": 9.538142681121826, + "mean_norm/layer16": 9.24304586648941, + "mean_norm/layer17": 9.510010719299316, + "mean_norm/layer18": 9.292459189891815, + "mean_norm/layer19": 9.304514169692993, + "mean_norm/layer2": 8.425727248191833, + "mean_norm/layer20": 9.394480288028717, + "mean_norm/layer21": 9.354299426078796, + "mean_norm/layer22": 9.803248167037964, + "mean_norm/layer23": 9.781766414642334, + "mean_norm/layer3": 9.47944289445877, + "mean_norm/layer4": 8.990542650222778, + "mean_norm/layer5": 10.04342132806778, + "mean_norm/layer6": 8.759501457214355, + "mean_norm/layer7": 9.006960988044739, + "mean_norm/layer8": 9.223146975040436, + "mean_norm/layer9": 9.196601152420044, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 3300 + }, + { + "epoch": 1.38, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.44939016723249087, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.8373703956604004, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8356, + "eval_samples_per_second": 20.362, + "eval_steps_per_second": 0.676, + "step": 3300 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.4, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8313, + "max_norm": 18.179218292236328, + "max_norm/layer0": 15.533577919006348, + "max_norm/layer1": 16.243879318237305, + "max_norm/layer10": 17.173385620117188, + "max_norm/layer11": 16.345731735229492, + "max_norm/layer12": 16.848569869995117, + "max_norm/layer13": 15.166905403137207, + "max_norm/layer14": 16.53302764892578, + "max_norm/layer15": 17.655122756958008, + "max_norm/layer16": 15.596038818359375, + "max_norm/layer17": 17.404146194458008, + "max_norm/layer18": 16.180326461791992, + "max_norm/layer19": 15.84206485748291, + "max_norm/layer2": 13.853592872619629, + "max_norm/layer20": 16.853952407836914, + "max_norm/layer21": 16.416898727416992, + "max_norm/layer22": 16.667673110961914, + "max_norm/layer23": 16.5629940032959, + "max_norm/layer3": 15.585241317749023, + "max_norm/layer4": 15.886917114257812, + "max_norm/layer5": 18.179218292236328, + "max_norm/layer6": 14.965940475463867, + "max_norm/layer7": 16.574649810791016, + "max_norm/layer8": 17.033422470092773, + "max_norm/layer9": 16.74019432067871, + "mean_norm": 9.304636073609194, + "mean_norm/layer0": 8.90590125322342, + "mean_norm/layer1": 8.973723888397217, + "mean_norm/layer10": 9.252578437328339, + "mean_norm/layer11": 9.392187356948853, + "mean_norm/layer12": 9.584810256958008, + "mean_norm/layer13": 9.203449964523315, + "mean_norm/layer14": 9.413988173007965, + "mean_norm/layer15": 9.554635107517242, + "mean_norm/layer16": 9.25671535730362, + "mean_norm/layer17": 9.526697039604187, + "mean_norm/layer18": 9.306841850280762, + "mean_norm/layer19": 9.31952553987503, + "mean_norm/layer2": 8.429565906524658, + "mean_norm/layer20": 9.409839034080505, + "mean_norm/layer21": 9.369287729263306, + "mean_norm/layer22": 9.82382595539093, + "mean_norm/layer23": 9.801779389381409, + "mean_norm/layer3": 9.494613111019135, + "mean_norm/layer4": 8.999967634677887, + "mean_norm/layer5": 10.064538836479187, + "mean_norm/layer6": 8.766620993614197, + "mean_norm/layer7": 9.016564190387726, + "mean_norm/layer8": 9.235347211360931, + "mean_norm/layer9": 9.208261549472809, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 3350 + }, + { + "epoch": 1.4, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4490372876131141, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.8347883224487305, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 10.7963, + "eval_samples_per_second": 22.322, + "eval_steps_per_second": 0.741, + "step": 3350 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.42, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8251, + "max_norm": 18.336759567260742, + "max_norm/layer0": 15.618881225585938, + "max_norm/layer1": 16.339771270751953, + "max_norm/layer10": 17.287466049194336, + "max_norm/layer11": 16.401472091674805, + "max_norm/layer12": 16.958864212036133, + "max_norm/layer13": 15.245092391967773, + "max_norm/layer14": 16.62425994873047, + "max_norm/layer15": 17.777263641357422, + "max_norm/layer16": 15.674489974975586, + "max_norm/layer17": 17.523509979248047, + "max_norm/layer18": 16.255813598632812, + "max_norm/layer19": 15.934908866882324, + "max_norm/layer2": 13.882692337036133, + "max_norm/layer20": 16.969314575195312, + "max_norm/layer21": 16.508270263671875, + "max_norm/layer22": 16.763980865478516, + "max_norm/layer23": 16.67099380493164, + "max_norm/layer3": 15.66022777557373, + "max_norm/layer4": 15.979378700256348, + "max_norm/layer5": 18.336759567260742, + "max_norm/layer6": 15.03795337677002, + "max_norm/layer7": 16.673524856567383, + "max_norm/layer8": 17.149028778076172, + "max_norm/layer9": 16.84016227722168, + "mean_norm": 9.318130704263845, + "mean_norm/layer0": 8.916600942611694, + "mean_norm/layer1": 8.984344899654388, + "mean_norm/layer10": 9.264764606952667, + "mean_norm/layer11": 9.40614765882492, + "mean_norm/layer12": 9.601603388786316, + "mean_norm/layer13": 9.216069042682648, + "mean_norm/layer14": 9.428646862506866, + "mean_norm/layer15": 9.570810496807098, + "mean_norm/layer16": 9.27027541399002, + "mean_norm/layer17": 9.542983949184418, + "mean_norm/layer18": 9.321069478988647, + "mean_norm/layer19": 9.3338503241539, + "mean_norm/layer2": 8.43327808380127, + "mean_norm/layer20": 9.42466515302658, + "mean_norm/layer21": 9.383947730064392, + "mean_norm/layer22": 9.844399809837341, + "mean_norm/layer23": 9.821134805679321, + "mean_norm/layer3": 9.50949090719223, + "mean_norm/layer4": 9.009099662303925, + "mean_norm/layer5": 10.085379660129547, + "mean_norm/layer6": 8.773491621017456, + "mean_norm/layer7": 9.025936245918274, + "mean_norm/layer8": 9.247284710407257, + "mean_norm/layer9": 9.219861447811127, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 3400 + }, + { + "epoch": 1.42, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.44893588542363805, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.8318352699279785, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6041, + "eval_samples_per_second": 20.769, + "eval_steps_per_second": 0.689, + "step": 3400 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.44, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8429, + "max_norm": 18.477962493896484, + "max_norm/layer0": 15.704484939575195, + "max_norm/layer1": 16.429656982421875, + "max_norm/layer10": 17.405029296875, + "max_norm/layer11": 16.489473342895508, + "max_norm/layer12": 17.07954978942871, + "max_norm/layer13": 15.339924812316895, + "max_norm/layer14": 16.736328125, + "max_norm/layer15": 17.899723052978516, + "max_norm/layer16": 15.776835441589355, + "max_norm/layer17": 17.662168502807617, + "max_norm/layer18": 16.360383987426758, + "max_norm/layer19": 16.030488967895508, + "max_norm/layer2": 13.910673141479492, + "max_norm/layer20": 17.0791015625, + "max_norm/layer21": 16.60880470275879, + "max_norm/layer22": 16.860157012939453, + "max_norm/layer23": 16.763296127319336, + "max_norm/layer3": 15.720104217529297, + "max_norm/layer4": 16.067779541015625, + "max_norm/layer5": 18.477962493896484, + "max_norm/layer6": 15.11044979095459, + "max_norm/layer7": 16.761457443237305, + "max_norm/layer8": 17.262792587280273, + "max_norm/layer9": 16.94117546081543, + "mean_norm": 9.331590088705221, + "mean_norm/layer0": 8.927314579486847, + "mean_norm/layer1": 8.99471640586853, + "mean_norm/layer10": 9.277050256729126, + "mean_norm/layer11": 9.420108437538147, + "mean_norm/layer12": 9.61855810880661, + "mean_norm/layer13": 9.22856056690216, + "mean_norm/layer14": 9.443263828754425, + "mean_norm/layer15": 9.586838006973267, + "mean_norm/layer16": 9.283744394779205, + "mean_norm/layer17": 9.559471309185028, + "mean_norm/layer18": 9.335309386253357, + "mean_norm/layer19": 9.348252415657043, + "mean_norm/layer2": 8.4369957447052, + "mean_norm/layer20": 9.439510464668274, + "mean_norm/layer21": 9.398659586906433, + "mean_norm/layer22": 9.864253401756287, + "mean_norm/layer23": 9.840354681015015, + "mean_norm/layer3": 9.524330019950867, + "mean_norm/layer4": 9.01804405450821, + "mean_norm/layer5": 10.106251001358032, + "mean_norm/layer6": 8.780368089675903, + "mean_norm/layer7": 9.035491406917572, + "mean_norm/layer8": 9.259211540222168, + "mean_norm/layer9": 9.231504440307617, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 3450 + }, + { + "epoch": 1.44, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4497430468518676, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.828789472579956, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 10.7908, + "eval_samples_per_second": 22.334, + "eval_steps_per_second": 0.741, + "step": 3450 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.46, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8397, + "max_norm": 18.612791061401367, + "max_norm/layer0": 15.785677909851074, + "max_norm/layer1": 16.514942169189453, + "max_norm/layer10": 17.51824951171875, + "max_norm/layer11": 16.590362548828125, + "max_norm/layer12": 17.19257354736328, + "max_norm/layer13": 15.409317970275879, + "max_norm/layer14": 16.837434768676758, + "max_norm/layer15": 17.997446060180664, + "max_norm/layer16": 15.877601623535156, + "max_norm/layer17": 17.79769515991211, + "max_norm/layer18": 16.465822219848633, + "max_norm/layer19": 16.119728088378906, + "max_norm/layer2": 13.954423904418945, + "max_norm/layer20": 17.191173553466797, + "max_norm/layer21": 16.693696975708008, + "max_norm/layer22": 16.954496383666992, + "max_norm/layer23": 16.847951889038086, + "max_norm/layer3": 15.772260665893555, + "max_norm/layer4": 16.147335052490234, + "max_norm/layer5": 18.612791061401367, + "max_norm/layer6": 15.16303825378418, + "max_norm/layer7": 16.8575439453125, + "max_norm/layer8": 17.3731689453125, + "max_norm/layer9": 17.055498123168945, + "mean_norm": 9.344837203621864, + "mean_norm/layer0": 8.937843799591064, + "mean_norm/layer1": 9.005088448524475, + "mean_norm/layer10": 9.289023041725159, + "mean_norm/layer11": 9.433656215667725, + "mean_norm/layer12": 9.635209679603577, + "mean_norm/layer13": 9.24088716506958, + "mean_norm/layer14": 9.457638919353485, + "mean_norm/layer15": 9.602668046951294, + "mean_norm/layer16": 9.296828985214233, + "mean_norm/layer17": 9.575341761112213, + "mean_norm/layer18": 9.349262356758118, + "mean_norm/layer19": 9.362391829490662, + "mean_norm/layer2": 8.44077605009079, + "mean_norm/layer20": 9.454284369945526, + "mean_norm/layer21": 9.413063526153564, + "mean_norm/layer22": 9.883745014667511, + "mean_norm/layer23": 9.859206199645996, + "mean_norm/layer3": 9.539020895957947, + "mean_norm/layer4": 9.027145206928253, + "mean_norm/layer5": 10.12680846452713, + "mean_norm/layer6": 8.787212014198303, + "mean_norm/layer7": 9.044856607913971, + "mean_norm/layer8": 9.271096289157867, + "mean_norm/layer9": 9.2430379986763, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 3500 + }, + { + "epoch": 1.46, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4511099483660051, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.8216705322265625, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.563, + "eval_samples_per_second": 20.842, + "eval_steps_per_second": 0.692, + "step": 3500 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.48, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.833, + "max_norm": 18.753446578979492, + "max_norm/layer0": 15.853753089904785, + "max_norm/layer1": 16.583667755126953, + "max_norm/layer10": 17.616392135620117, + "max_norm/layer11": 16.686279296875, + "max_norm/layer12": 17.2836856842041, + "max_norm/layer13": 15.484760284423828, + "max_norm/layer14": 16.939178466796875, + "max_norm/layer15": 18.10690689086914, + "max_norm/layer16": 15.978145599365234, + "max_norm/layer17": 17.911317825317383, + "max_norm/layer18": 16.60814666748047, + "max_norm/layer19": 16.217397689819336, + "max_norm/layer2": 13.995329856872559, + "max_norm/layer20": 17.310771942138672, + "max_norm/layer21": 16.784269332885742, + "max_norm/layer22": 17.0494384765625, + "max_norm/layer23": 16.949352264404297, + "max_norm/layer3": 15.835954666137695, + "max_norm/layer4": 16.24813461303711, + "max_norm/layer5": 18.753446578979492, + "max_norm/layer6": 15.2390718460083, + "max_norm/layer7": 16.97339630126953, + "max_norm/layer8": 17.472185134887695, + "max_norm/layer9": 17.17030906677246, + "mean_norm": 9.358108803629875, + "mean_norm/layer0": 8.948367297649384, + "mean_norm/layer1": 9.015483260154724, + "mean_norm/layer10": 9.300959289073944, + "mean_norm/layer11": 9.44746309518814, + "mean_norm/layer12": 9.651969850063324, + "mean_norm/layer13": 9.253294944763184, + "mean_norm/layer14": 9.472301483154297, + "mean_norm/layer15": 9.618704080581665, + "mean_norm/layer16": 9.310149073600769, + "mean_norm/layer17": 9.591234683990479, + "mean_norm/layer18": 9.36311811208725, + "mean_norm/layer19": 9.376516222953796, + "mean_norm/layer2": 8.444473266601562, + "mean_norm/layer20": 9.46895295381546, + "mean_norm/layer21": 9.42733383178711, + "mean_norm/layer22": 9.903033971786499, + "mean_norm/layer23": 9.87805551290512, + "mean_norm/layer3": 9.553642868995667, + "mean_norm/layer4": 9.036168217658997, + "mean_norm/layer5": 10.147434830665588, + "mean_norm/layer6": 8.794258058071136, + "mean_norm/layer7": 9.054118037223816, + "mean_norm/layer8": 9.283077836036682, + "mean_norm/layer9": 9.25450050830841, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 3550 + }, + { + "epoch": 1.48, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4499134025301874, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.825397253036499, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8024, + "eval_samples_per_second": 20.42, + "eval_steps_per_second": 0.678, + "step": 3550 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.5, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8209, + "max_norm": 18.887266159057617, + "max_norm/layer0": 15.928442001342773, + "max_norm/layer1": 16.638465881347656, + "max_norm/layer10": 17.713111877441406, + "max_norm/layer11": 16.772506713867188, + "max_norm/layer12": 17.393291473388672, + "max_norm/layer13": 15.576926231384277, + "max_norm/layer14": 17.04795265197754, + "max_norm/layer15": 18.229637145996094, + "max_norm/layer16": 16.101669311523438, + "max_norm/layer17": 18.021533966064453, + "max_norm/layer18": 16.741031646728516, + "max_norm/layer19": 16.309358596801758, + "max_norm/layer2": 14.079461097717285, + "max_norm/layer20": 17.407546997070312, + "max_norm/layer21": 16.90997314453125, + "max_norm/layer22": 17.160221099853516, + "max_norm/layer23": 17.035873413085938, + "max_norm/layer3": 15.932682991027832, + "max_norm/layer4": 16.348690032958984, + "max_norm/layer5": 18.887266159057617, + "max_norm/layer6": 15.295527458190918, + "max_norm/layer7": 17.097925186157227, + "max_norm/layer8": 17.554088592529297, + "max_norm/layer9": 17.282934188842773, + "mean_norm": 9.371505024532476, + "mean_norm/layer0": 8.959096014499664, + "mean_norm/layer1": 9.026121318340302, + "mean_norm/layer10": 9.313242495059967, + "mean_norm/layer11": 9.461414635181427, + "mean_norm/layer12": 9.668856620788574, + "mean_norm/layer13": 9.265742599964142, + "mean_norm/layer14": 9.486914694309235, + "mean_norm/layer15": 9.634682357311249, + "mean_norm/layer16": 9.323372840881348, + "mean_norm/layer17": 9.60727709531784, + "mean_norm/layer18": 9.377022087574005, + "mean_norm/layer19": 9.390734195709229, + "mean_norm/layer2": 8.448146045207977, + "mean_norm/layer20": 9.483981490135193, + "mean_norm/layer21": 9.441752195358276, + "mean_norm/layer22": 9.922874212265015, + "mean_norm/layer23": 9.897243618965149, + "mean_norm/layer3": 9.568353295326233, + "mean_norm/layer4": 9.04521918296814, + "mean_norm/layer5": 10.168164014816284, + "mean_norm/layer6": 8.801159620285034, + "mean_norm/layer7": 9.063514709472656, + "mean_norm/layer8": 9.295092165470123, + "mean_norm/layer9": 9.266143083572388, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 3600 + }, + { + "epoch": 1.5, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.45093148051252724, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.8219504356384277, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7946, + "eval_samples_per_second": 20.433, + "eval_steps_per_second": 0.678, + "step": 3600 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.52, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8336, + "max_norm": 19.024261474609375, + "max_norm/layer0": 16.005525588989258, + "max_norm/layer1": 16.7034854888916, + "max_norm/layer10": 17.81429100036621, + "max_norm/layer11": 16.852542877197266, + "max_norm/layer12": 17.491962432861328, + "max_norm/layer13": 15.668417930603027, + "max_norm/layer14": 17.154603958129883, + "max_norm/layer15": 18.34808921813965, + "max_norm/layer16": 16.209043502807617, + "max_norm/layer17": 18.15737533569336, + "max_norm/layer18": 16.833559036254883, + "max_norm/layer19": 16.41221046447754, + "max_norm/layer2": 14.156972885131836, + "max_norm/layer20": 17.505290985107422, + "max_norm/layer21": 17.016029357910156, + "max_norm/layer22": 17.268396377563477, + "max_norm/layer23": 17.125720977783203, + "max_norm/layer3": 16.029821395874023, + "max_norm/layer4": 16.439924240112305, + "max_norm/layer5": 19.024261474609375, + "max_norm/layer6": 15.357059478759766, + "max_norm/layer7": 17.220069885253906, + "max_norm/layer8": 17.65226173400879, + "max_norm/layer9": 17.398624420166016, + "mean_norm": 9.384601970513662, + "mean_norm/layer0": 8.969634473323822, + "mean_norm/layer1": 9.036478281021118, + "mean_norm/layer10": 9.325130581855774, + "mean_norm/layer11": 9.475057005882263, + "mean_norm/layer12": 9.685044169425964, + "mean_norm/layer13": 9.277792394161224, + "mean_norm/layer14": 9.501095294952393, + "mean_norm/layer15": 9.650285363197327, + "mean_norm/layer16": 9.336541652679443, + "mean_norm/layer17": 9.623004257678986, + "mean_norm/layer18": 9.390738606452942, + "mean_norm/layer19": 9.404767334461212, + "mean_norm/layer2": 8.451732337474823, + "mean_norm/layer20": 9.498468458652496, + "mean_norm/layer21": 9.456099450588226, + "mean_norm/layer22": 9.942264795303345, + "mean_norm/layer23": 9.915738880634308, + "mean_norm/layer3": 9.582852602005005, + "mean_norm/layer4": 9.054056227207184, + "mean_norm/layer5": 10.188653767108917, + "mean_norm/layer6": 8.807803988456726, + "mean_norm/layer7": 9.072685480117798, + "mean_norm/layer8": 9.306782305240631, + "mean_norm/layer9": 9.277739584445953, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 3650 + }, + { + "epoch": 1.52, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.45114645315421653, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.8175899982452393, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5432, + "eval_samples_per_second": 20.878, + "eval_steps_per_second": 0.693, + "step": 3650 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.54, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8139, + "max_norm": 19.137977600097656, + "max_norm/layer0": 16.0833740234375, + "max_norm/layer1": 16.776784896850586, + "max_norm/layer10": 17.91156578063965, + "max_norm/layer11": 16.949214935302734, + "max_norm/layer12": 17.602840423583984, + "max_norm/layer13": 15.76510238647461, + "max_norm/layer14": 17.248186111450195, + "max_norm/layer15": 18.48503303527832, + "max_norm/layer16": 16.319406509399414, + "max_norm/layer17": 18.264812469482422, + "max_norm/layer18": 16.932689666748047, + "max_norm/layer19": 16.511192321777344, + "max_norm/layer2": 14.22626781463623, + "max_norm/layer20": 17.621082305908203, + "max_norm/layer21": 17.110122680664062, + "max_norm/layer22": 17.374183654785156, + "max_norm/layer23": 17.20750617980957, + "max_norm/layer3": 16.11916732788086, + "max_norm/layer4": 16.518123626708984, + "max_norm/layer5": 19.137977600097656, + "max_norm/layer6": 15.443400382995605, + "max_norm/layer7": 17.33040428161621, + "max_norm/layer8": 17.752338409423828, + "max_norm/layer9": 17.495275497436523, + "mean_norm": 9.39769247919321, + "mean_norm/layer0": 8.980181157588959, + "mean_norm/layer1": 9.046735346317291, + "mean_norm/layer10": 9.337104260921478, + "mean_norm/layer11": 9.48857319355011, + "mean_norm/layer12": 9.701455056667328, + "mean_norm/layer13": 9.290168941020966, + "mean_norm/layer14": 9.51529061794281, + "mean_norm/layer15": 9.665862381458282, + "mean_norm/layer16": 9.349638223648071, + "mean_norm/layer17": 9.638719916343689, + "mean_norm/layer18": 9.40440809726715, + "mean_norm/layer19": 9.418926656246185, + "mean_norm/layer2": 8.45537531375885, + "mean_norm/layer20": 9.513044118881226, + "mean_norm/layer21": 9.470202088356018, + "mean_norm/layer22": 9.961255609989166, + "mean_norm/layer23": 9.934356808662415, + "mean_norm/layer3": 9.597356498241425, + "mean_norm/layer4": 9.062905848026276, + "mean_norm/layer5": 10.208882927894592, + "mean_norm/layer6": 8.814568221569061, + "mean_norm/layer7": 9.08190244436264, + "mean_norm/layer8": 9.31855446100235, + "mean_norm/layer9": 9.289151310920715, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 3700 + }, + { + "epoch": 1.54, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.45146282798538184, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.8167974948883057, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5485, + "eval_samples_per_second": 20.869, + "eval_steps_per_second": 0.693, + "step": 3700 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.57, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8155, + "max_norm": 19.25054931640625, + "max_norm/layer0": 16.164255142211914, + "max_norm/layer1": 16.874256134033203, + "max_norm/layer10": 18.021665573120117, + "max_norm/layer11": 17.04458236694336, + "max_norm/layer12": 17.710533142089844, + "max_norm/layer13": 15.850334167480469, + "max_norm/layer14": 17.3418025970459, + "max_norm/layer15": 18.614669799804688, + "max_norm/layer16": 16.4307804107666, + "max_norm/layer17": 18.387475967407227, + "max_norm/layer18": 17.02359390258789, + "max_norm/layer19": 16.638124465942383, + "max_norm/layer2": 14.282529830932617, + "max_norm/layer20": 17.732723236083984, + "max_norm/layer21": 17.204208374023438, + "max_norm/layer22": 17.47235870361328, + "max_norm/layer23": 17.30570411682129, + "max_norm/layer3": 16.197643280029297, + "max_norm/layer4": 16.596391677856445, + "max_norm/layer5": 19.25054931640625, + "max_norm/layer6": 15.518656730651855, + "max_norm/layer7": 17.450822830200195, + "max_norm/layer8": 17.837682723999023, + "max_norm/layer9": 17.59002685546875, + "mean_norm": 9.410545006394386, + "mean_norm/layer0": 8.99051821231842, + "mean_norm/layer1": 9.056912958621979, + "mean_norm/layer10": 9.348880767822266, + "mean_norm/layer11": 9.501977682113647, + "mean_norm/layer12": 9.717777132987976, + "mean_norm/layer13": 9.302150130271912, + "mean_norm/layer14": 9.52913784980774, + "mean_norm/layer15": 9.681376457214355, + "mean_norm/layer16": 9.362551271915436, + "mean_norm/layer17": 9.654209911823273, + "mean_norm/layer18": 9.417977392673492, + "mean_norm/layer19": 9.432604491710663, + "mean_norm/layer2": 8.458954632282257, + "mean_norm/layer20": 9.526868760585785, + "mean_norm/layer21": 9.484004497528076, + "mean_norm/layer22": 9.980139374732971, + "mean_norm/layer23": 9.952777981758118, + "mean_norm/layer3": 9.611551821231842, + "mean_norm/layer4": 9.071687638759613, + "mean_norm/layer5": 10.228794932365417, + "mean_norm/layer6": 8.821084141731262, + "mean_norm/layer7": 9.090995073318481, + "mean_norm/layer8": 9.329946517944336, + "mean_norm/layer9": 9.300200521945953, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 3750 + }, + { + "epoch": 1.57, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4517873149917053, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.812666177749634, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7797, + "eval_samples_per_second": 20.459, + "eval_steps_per_second": 0.679, + "step": 3750 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.59, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8196, + "max_norm": 19.39119529724121, + "max_norm/layer0": 16.249656677246094, + "max_norm/layer1": 16.963245391845703, + "max_norm/layer10": 18.125328063964844, + "max_norm/layer11": 17.15520477294922, + "max_norm/layer12": 17.828350067138672, + "max_norm/layer13": 15.930174827575684, + "max_norm/layer14": 17.422183990478516, + "max_norm/layer15": 18.75629997253418, + "max_norm/layer16": 16.539464950561523, + "max_norm/layer17": 18.515911102294922, + "max_norm/layer18": 17.11224365234375, + "max_norm/layer19": 16.767332077026367, + "max_norm/layer2": 14.359777450561523, + "max_norm/layer20": 17.840478897094727, + "max_norm/layer21": 17.309904098510742, + "max_norm/layer22": 17.559303283691406, + "max_norm/layer23": 17.389223098754883, + "max_norm/layer3": 16.30811309814453, + "max_norm/layer4": 16.692081451416016, + "max_norm/layer5": 19.39119529724121, + "max_norm/layer6": 15.620407104492188, + "max_norm/layer7": 17.557313919067383, + "max_norm/layer8": 17.944181442260742, + "max_norm/layer9": 17.681028366088867, + "mean_norm": 9.423318974673748, + "mean_norm/layer0": 9.000839114189148, + "mean_norm/layer1": 9.066909670829773, + "mean_norm/layer10": 9.36047077178955, + "mean_norm/layer11": 9.515274345874786, + "mean_norm/layer12": 9.733893871307373, + "mean_norm/layer13": 9.31408303976059, + "mean_norm/layer14": 9.542948007583618, + "mean_norm/layer15": 9.696711778640747, + "mean_norm/layer16": 9.375279724597931, + "mean_norm/layer17": 9.66939002275467, + "mean_norm/layer18": 9.431337356567383, + "mean_norm/layer19": 9.446298122406006, + "mean_norm/layer2": 8.462641179561615, + "mean_norm/layer20": 9.540704071521759, + "mean_norm/layer21": 9.49764209985733, + "mean_norm/layer22": 9.998992681503296, + "mean_norm/layer23": 9.971072018146515, + "mean_norm/layer3": 9.62577337026596, + "mean_norm/layer4": 9.08018147945404, + "mean_norm/layer5": 10.248691976070404, + "mean_norm/layer6": 8.82778912782669, + "mean_norm/layer7": 9.100020945072174, + "mean_norm/layer8": 9.34142941236496, + "mean_norm/layer9": 9.311281204223633, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 3800 + }, + { + "epoch": 1.59, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4525701398944606, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.8062896728515625, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.533, + "eval_samples_per_second": 20.896, + "eval_steps_per_second": 0.694, + "step": 3800 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.61, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8083, + "max_norm": 19.52190589904785, + "max_norm/layer0": 16.348299026489258, + "max_norm/layer1": 17.05620574951172, + "max_norm/layer10": 18.23882293701172, + "max_norm/layer11": 17.240055084228516, + "max_norm/layer12": 17.929933547973633, + "max_norm/layer13": 16.006711959838867, + "max_norm/layer14": 17.513385772705078, + "max_norm/layer15": 18.893762588500977, + "max_norm/layer16": 16.633769989013672, + "max_norm/layer17": 18.641620635986328, + "max_norm/layer18": 17.20274543762207, + "max_norm/layer19": 16.888694763183594, + "max_norm/layer2": 14.43471908569336, + "max_norm/layer20": 17.956628799438477, + "max_norm/layer21": 17.431379318237305, + "max_norm/layer22": 17.653854370117188, + "max_norm/layer23": 17.478567123413086, + "max_norm/layer3": 16.408828735351562, + "max_norm/layer4": 16.770822525024414, + "max_norm/layer5": 19.52190589904785, + "max_norm/layer6": 15.692330360412598, + "max_norm/layer7": 17.65044403076172, + "max_norm/layer8": 18.09210777282715, + "max_norm/layer9": 17.78131103515625, + "mean_norm": 9.436038424571356, + "mean_norm/layer0": 9.01114821434021, + "mean_norm/layer1": 9.077042877674103, + "mean_norm/layer10": 9.372229039669037, + "mean_norm/layer11": 9.528716921806335, + "mean_norm/layer12": 9.750010967254639, + "mean_norm/layer13": 9.325950026512146, + "mean_norm/layer14": 9.556561589241028, + "mean_norm/layer15": 9.711856067180634, + "mean_norm/layer16": 9.387940168380737, + "mean_norm/layer17": 9.684573650360107, + "mean_norm/layer18": 9.444583415985107, + "mean_norm/layer19": 9.459890902042389, + "mean_norm/layer2": 8.466160774230957, + "mean_norm/layer20": 9.554618656635284, + "mean_norm/layer21": 9.511114656925201, + "mean_norm/layer22": 10.017443120479584, + "mean_norm/layer23": 9.9893519282341, + "mean_norm/layer3": 9.639805853366852, + "mean_norm/layer4": 9.088814616203308, + "mean_norm/layer5": 10.268649756908417, + "mean_norm/layer6": 8.834497690200806, + "mean_norm/layer7": 9.108858048915863, + "mean_norm/layer8": 9.352881073951721, + "mean_norm/layer9": 9.322222173213959, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 3850 + }, + { + "epoch": 1.61, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4524444011795103, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.804806709289551, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7887, + "eval_samples_per_second": 20.443, + "eval_steps_per_second": 0.679, + "step": 3850 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.63, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8202, + "max_norm": 19.663883209228516, + "max_norm/layer0": 16.442665100097656, + "max_norm/layer1": 17.14680290222168, + "max_norm/layer10": 18.334035873413086, + "max_norm/layer11": 17.328901290893555, + "max_norm/layer12": 18.035051345825195, + "max_norm/layer13": 16.093976974487305, + "max_norm/layer14": 17.588014602661133, + "max_norm/layer15": 19.004194259643555, + "max_norm/layer16": 16.748910903930664, + "max_norm/layer17": 18.775148391723633, + "max_norm/layer18": 17.282062530517578, + "max_norm/layer19": 16.9793758392334, + "max_norm/layer2": 14.499808311462402, + "max_norm/layer20": 18.059389114379883, + "max_norm/layer21": 17.545143127441406, + "max_norm/layer22": 17.755186080932617, + "max_norm/layer23": 17.595932006835938, + "max_norm/layer3": 16.477340698242188, + "max_norm/layer4": 16.84396743774414, + "max_norm/layer5": 19.663883209228516, + "max_norm/layer6": 15.78128433227539, + "max_norm/layer7": 17.734956741333008, + "max_norm/layer8": 18.204540252685547, + "max_norm/layer9": 17.8907527923584, + "mean_norm": 9.44852451235056, + "mean_norm/layer0": 9.02129864692688, + "mean_norm/layer1": 9.086955904960632, + "mean_norm/layer10": 9.383722841739655, + "mean_norm/layer11": 9.54167753458023, + "mean_norm/layer12": 9.765829026699066, + "mean_norm/layer13": 9.337481915950775, + "mean_norm/layer14": 9.57017594575882, + "mean_norm/layer15": 9.726840198040009, + "mean_norm/layer16": 9.400262773036957, + "mean_norm/layer17": 9.699501633644104, + "mean_norm/layer18": 9.457594335079193, + "mean_norm/layer19": 9.473425507545471, + "mean_norm/layer2": 8.469590187072754, + "mean_norm/layer20": 9.56819599866867, + "mean_norm/layer21": 9.52423882484436, + "mean_norm/layer22": 10.035979628562927, + "mean_norm/layer23": 10.007273077964783, + "mean_norm/layer3": 9.65359890460968, + "mean_norm/layer4": 9.097174227237701, + "mean_norm/layer5": 10.288195967674255, + "mean_norm/layer6": 8.840922951698303, + "mean_norm/layer7": 9.11753261089325, + "mean_norm/layer8": 9.364024937152863, + "mean_norm/layer9": 9.333094716072083, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 3900 + }, + { + "epoch": 1.63, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.45347870351216624, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.798917770385742, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5468, + "eval_samples_per_second": 20.872, + "eval_steps_per_second": 0.693, + "step": 3900 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.65, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8285, + "max_norm": 19.807249069213867, + "max_norm/layer0": 16.5258731842041, + "max_norm/layer1": 17.226022720336914, + "max_norm/layer10": 18.431427001953125, + "max_norm/layer11": 17.429719924926758, + "max_norm/layer12": 18.14910888671875, + "max_norm/layer13": 16.1771297454834, + "max_norm/layer14": 17.663759231567383, + "max_norm/layer15": 19.13890266418457, + "max_norm/layer16": 16.864423751831055, + "max_norm/layer17": 18.906938552856445, + "max_norm/layer18": 17.375585556030273, + "max_norm/layer19": 17.078645706176758, + "max_norm/layer2": 14.565903663635254, + "max_norm/layer20": 18.17165756225586, + "max_norm/layer21": 17.667926788330078, + "max_norm/layer22": 17.864042282104492, + "max_norm/layer23": 17.719139099121094, + "max_norm/layer3": 16.543764114379883, + "max_norm/layer4": 16.923555374145508, + "max_norm/layer5": 19.807249069213867, + "max_norm/layer6": 15.881307601928711, + "max_norm/layer7": 17.841663360595703, + "max_norm/layer8": 18.302600860595703, + "max_norm/layer9": 17.986249923706055, + "mean_norm": 9.460952490568161, + "mean_norm/layer0": 9.031491935253143, + "mean_norm/layer1": 9.096881031990051, + "mean_norm/layer10": 9.395167052745819, + "mean_norm/layer11": 9.554674923419952, + "mean_norm/layer12": 9.78170108795166, + "mean_norm/layer13": 9.348976492881775, + "mean_norm/layer14": 9.58379751443863, + "mean_norm/layer15": 9.741581797599792, + "mean_norm/layer16": 9.412635207176208, + "mean_norm/layer17": 9.714325428009033, + "mean_norm/layer18": 9.470487415790558, + "mean_norm/layer19": 9.48645406961441, + "mean_norm/layer2": 8.473007798194885, + "mean_norm/layer20": 9.581475257873535, + "mean_norm/layer21": 9.537485659122467, + "mean_norm/layer22": 10.05451250076294, + "mean_norm/layer23": 10.025010108947754, + "mean_norm/layer3": 9.667511641979218, + "mean_norm/layer4": 9.105651140213013, + "mean_norm/layer5": 10.307395875453949, + "mean_norm/layer6": 8.847305834293365, + "mean_norm/layer7": 9.126248717308044, + "mean_norm/layer8": 9.375205636024475, + "mean_norm/layer9": 9.343875646591187, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 3950 + }, + { + "epoch": 1.65, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4531826091188961, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.800121307373047, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8098, + "eval_samples_per_second": 20.407, + "eval_steps_per_second": 0.677, + "step": 3950 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.67, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8144, + "max_norm": 19.9642276763916, + "max_norm/layer0": 16.61147117614746, + "max_norm/layer1": 17.310283660888672, + "max_norm/layer10": 18.5467472076416, + "max_norm/layer11": 17.51737403869629, + "max_norm/layer12": 18.284799575805664, + "max_norm/layer13": 16.269195556640625, + "max_norm/layer14": 17.733585357666016, + "max_norm/layer15": 19.260528564453125, + "max_norm/layer16": 16.976835250854492, + "max_norm/layer17": 19.035781860351562, + "max_norm/layer18": 17.47535514831543, + "max_norm/layer19": 17.174304962158203, + "max_norm/layer2": 14.622349739074707, + "max_norm/layer20": 18.276771545410156, + "max_norm/layer21": 17.77849769592285, + "max_norm/layer22": 17.960010528564453, + "max_norm/layer23": 17.830236434936523, + "max_norm/layer3": 16.622806549072266, + "max_norm/layer4": 16.99311637878418, + "max_norm/layer5": 19.9642276763916, + "max_norm/layer6": 15.971922874450684, + "max_norm/layer7": 17.943126678466797, + "max_norm/layer8": 18.38897132873535, + "max_norm/layer9": 18.076162338256836, + "mean_norm": 9.473361556728682, + "mean_norm/layer0": 9.041697025299072, + "mean_norm/layer1": 9.106783270835876, + "mean_norm/layer10": 9.40651547908783, + "mean_norm/layer11": 9.567744493484497, + "mean_norm/layer12": 9.79739373922348, + "mean_norm/layer13": 9.360623478889465, + "mean_norm/layer14": 9.59718006849289, + "mean_norm/layer15": 9.75637936592102, + "mean_norm/layer16": 9.424761176109314, + "mean_norm/layer17": 9.729040384292603, + "mean_norm/layer18": 9.483455121517181, + "mean_norm/layer19": 9.499560296535492, + "mean_norm/layer2": 8.476477980613708, + "mean_norm/layer20": 9.594904780387878, + "mean_norm/layer21": 9.55079185962677, + "mean_norm/layer22": 10.07281231880188, + "mean_norm/layer23": 10.042850077152252, + "mean_norm/layer3": 9.681340396404266, + "mean_norm/layer4": 9.11408942937851, + "mean_norm/layer5": 10.326896071434021, + "mean_norm/layer6": 8.85367339849472, + "mean_norm/layer7": 9.134850978851318, + "mean_norm/layer8": 9.386187195777893, + "mean_norm/layer9": 9.354668974876404, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 4000 + }, + { + "epoch": 1.67, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.45394920967133523, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.8009955883026123, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8157, + "eval_samples_per_second": 20.397, + "eval_steps_per_second": 0.677, + "step": 4000 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.69, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.818, + "max_norm": 20.119094848632812, + "max_norm/layer0": 16.698545455932617, + "max_norm/layer1": 17.391803741455078, + "max_norm/layer10": 18.6510066986084, + "max_norm/layer11": 17.621688842773438, + "max_norm/layer12": 18.390403747558594, + "max_norm/layer13": 16.343536376953125, + "max_norm/layer14": 17.814393997192383, + "max_norm/layer15": 19.369619369506836, + "max_norm/layer16": 17.107633590698242, + "max_norm/layer17": 19.145732879638672, + "max_norm/layer18": 17.571773529052734, + "max_norm/layer19": 17.277477264404297, + "max_norm/layer2": 14.673759460449219, + "max_norm/layer20": 18.38888931274414, + "max_norm/layer21": 17.876964569091797, + "max_norm/layer22": 18.05607795715332, + "max_norm/layer23": 17.937580108642578, + "max_norm/layer3": 16.682743072509766, + "max_norm/layer4": 17.070730209350586, + "max_norm/layer5": 20.119094848632812, + "max_norm/layer6": 16.04961585998535, + "max_norm/layer7": 18.03361701965332, + "max_norm/layer8": 18.491865158081055, + "max_norm/layer9": 18.16168975830078, + "mean_norm": 9.485714507599672, + "mean_norm/layer0": 9.051836490631104, + "mean_norm/layer1": 9.116701900959015, + "mean_norm/layer10": 9.41792494058609, + "mean_norm/layer11": 9.58076012134552, + "mean_norm/layer12": 9.813140749931335, + "mean_norm/layer13": 9.37224268913269, + "mean_norm/layer14": 9.61046987771988, + "mean_norm/layer15": 9.771362841129303, + "mean_norm/layer16": 9.43696254491806, + "mean_norm/layer17": 9.743814766407013, + "mean_norm/layer18": 9.496419370174408, + "mean_norm/layer19": 9.512612521648407, + "mean_norm/layer2": 8.479991137981415, + "mean_norm/layer20": 9.608174979686737, + "mean_norm/layer21": 9.563690483570099, + "mean_norm/layer22": 10.09063470363617, + "mean_norm/layer23": 10.060266733169556, + "mean_norm/layer3": 9.69506311416626, + "mean_norm/layer4": 9.122413873672485, + "mean_norm/layer5": 10.346292912960052, + "mean_norm/layer6": 8.86014074087143, + "mean_norm/layer7": 9.143555641174316, + "mean_norm/layer8": 9.397226512432098, + "mean_norm/layer9": 9.365448534488678, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 4050 + }, + { + "epoch": 1.69, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4548821098145151, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7933807373046875, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5572, + "eval_samples_per_second": 20.853, + "eval_steps_per_second": 0.692, + "step": 4050 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.71, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8114, + "max_norm": 20.25312042236328, + "max_norm/layer0": 16.780771255493164, + "max_norm/layer1": 17.454378128051758, + "max_norm/layer10": 18.746997833251953, + "max_norm/layer11": 17.710874557495117, + "max_norm/layer12": 18.502702713012695, + "max_norm/layer13": 16.42099380493164, + "max_norm/layer14": 17.885833740234375, + "max_norm/layer15": 19.495311737060547, + "max_norm/layer16": 17.204898834228516, + "max_norm/layer17": 19.27667236328125, + "max_norm/layer18": 17.681575775146484, + "max_norm/layer19": 17.363557815551758, + "max_norm/layer2": 14.722838401794434, + "max_norm/layer20": 18.501394271850586, + "max_norm/layer21": 17.964780807495117, + "max_norm/layer22": 18.162660598754883, + "max_norm/layer23": 18.065580368041992, + "max_norm/layer3": 16.761926651000977, + "max_norm/layer4": 17.149524688720703, + "max_norm/layer5": 20.25312042236328, + "max_norm/layer6": 16.114870071411133, + "max_norm/layer7": 18.13249397277832, + "max_norm/layer8": 18.5709285736084, + "max_norm/layer9": 18.23674201965332, + "mean_norm": 9.497905241946379, + "mean_norm/layer0": 9.06176507472992, + "mean_norm/layer1": 9.126475751399994, + "mean_norm/layer10": 9.429007589817047, + "mean_norm/layer11": 9.593652665615082, + "mean_norm/layer12": 9.828673005104065, + "mean_norm/layer13": 9.383624970912933, + "mean_norm/layer14": 9.623692214488983, + "mean_norm/layer15": 9.786072611808777, + "mean_norm/layer16": 9.44901967048645, + "mean_norm/layer17": 9.758347272872925, + "mean_norm/layer18": 9.50903469324112, + "mean_norm/layer19": 9.525338292121887, + "mean_norm/layer2": 8.483352661132812, + "mean_norm/layer20": 9.621620059013367, + "mean_norm/layer21": 9.576579630374908, + "mean_norm/layer22": 10.108359515666962, + "mean_norm/layer23": 10.077474415302277, + "mean_norm/layer3": 9.708677530288696, + "mean_norm/layer4": 9.130702793598175, + "mean_norm/layer5": 10.365319192409515, + "mean_norm/layer6": 8.866493701934814, + "mean_norm/layer7": 9.152141213417053, + "mean_norm/layer8": 9.4082390666008, + "mean_norm/layer9": 9.376062214374542, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 4100 + }, + { + "epoch": 1.71, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.45488616590209413, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.791409730911255, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8171, + "eval_samples_per_second": 20.394, + "eval_steps_per_second": 0.677, + "step": 4100 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.73, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8119, + "max_norm": 20.371471405029297, + "max_norm/layer0": 16.874263763427734, + "max_norm/layer1": 17.524900436401367, + "max_norm/layer10": 18.839059829711914, + "max_norm/layer11": 17.782032012939453, + "max_norm/layer12": 18.594261169433594, + "max_norm/layer13": 16.51697540283203, + "max_norm/layer14": 17.984203338623047, + "max_norm/layer15": 19.61891746520996, + "max_norm/layer16": 17.298097610473633, + "max_norm/layer17": 19.423992156982422, + "max_norm/layer18": 17.77617073059082, + "max_norm/layer19": 17.44768524169922, + "max_norm/layer2": 14.78378677368164, + "max_norm/layer20": 18.631628036499023, + "max_norm/layer21": 18.048566818237305, + "max_norm/layer22": 18.257789611816406, + "max_norm/layer23": 18.17466926574707, + "max_norm/layer3": 16.853816986083984, + "max_norm/layer4": 17.234498977661133, + "max_norm/layer5": 20.371471405029297, + "max_norm/layer6": 16.19548797607422, + "max_norm/layer7": 18.227479934692383, + "max_norm/layer8": 18.656274795532227, + "max_norm/layer9": 18.30875587463379, + "mean_norm": 9.51002257068952, + "mean_norm/layer0": 9.071641266345978, + "mean_norm/layer1": 9.136261284351349, + "mean_norm/layer10": 9.440190315246582, + "mean_norm/layer11": 9.606357514858246, + "mean_norm/layer12": 9.84403681755066, + "mean_norm/layer13": 9.395072102546692, + "mean_norm/layer14": 9.63693481683731, + "mean_norm/layer15": 9.800684869289398, + "mean_norm/layer16": 9.46108591556549, + "mean_norm/layer17": 9.77271944284439, + "mean_norm/layer18": 9.52157312631607, + "mean_norm/layer19": 9.537791013717651, + "mean_norm/layer2": 8.486609101295471, + "mean_norm/layer20": 9.634786188602448, + "mean_norm/layer21": 9.589442670345306, + "mean_norm/layer22": 10.12604534626007, + "mean_norm/layer23": 10.094537377357483, + "mean_norm/layer3": 9.722192883491516, + "mean_norm/layer4": 9.13902497291565, + "mean_norm/layer5": 10.384238183498383, + "mean_norm/layer6": 8.872731864452362, + "mean_norm/layer7": 9.16065239906311, + "mean_norm/layer8": 9.419233560562134, + "mean_norm/layer9": 9.38669866323471, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 4150 + }, + { + "epoch": 1.73, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4547360906616696, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7870960235595703, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.795, + "eval_samples_per_second": 20.432, + "eval_steps_per_second": 0.678, + "step": 4150 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.75, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8018, + "max_norm": 20.499284744262695, + "max_norm/layer0": 16.95836067199707, + "max_norm/layer1": 17.592952728271484, + "max_norm/layer10": 18.959768295288086, + "max_norm/layer11": 17.883838653564453, + "max_norm/layer12": 18.69440460205078, + "max_norm/layer13": 16.596149444580078, + "max_norm/layer14": 18.067346572875977, + "max_norm/layer15": 19.74480438232422, + "max_norm/layer16": 17.383577346801758, + "max_norm/layer17": 19.56295394897461, + "max_norm/layer18": 17.864219665527344, + "max_norm/layer19": 17.51543617248535, + "max_norm/layer2": 14.8399658203125, + "max_norm/layer20": 18.730480194091797, + "max_norm/layer21": 18.160423278808594, + "max_norm/layer22": 18.353191375732422, + "max_norm/layer23": 18.279525756835938, + "max_norm/layer3": 16.928646087646484, + "max_norm/layer4": 17.300979614257812, + "max_norm/layer5": 20.499284744262695, + "max_norm/layer6": 16.267253875732422, + "max_norm/layer7": 18.32831573486328, + "max_norm/layer8": 18.737327575683594, + "max_norm/layer9": 18.41295623779297, + "mean_norm": 9.522137492895126, + "mean_norm/layer0": 9.081620931625366, + "mean_norm/layer1": 9.14617645740509, + "mean_norm/layer10": 9.451456010341644, + "mean_norm/layer11": 9.61904102563858, + "mean_norm/layer12": 9.859608888626099, + "mean_norm/layer13": 9.406528949737549, + "mean_norm/layer14": 9.650117576122284, + "mean_norm/layer15": 9.815293192863464, + "mean_norm/layer16": 9.473051249980927, + "mean_norm/layer17": 9.78711074590683, + "mean_norm/layer18": 9.534133493900299, + "mean_norm/layer19": 9.550578236579895, + "mean_norm/layer2": 8.48985767364502, + "mean_norm/layer20": 9.64762568473816, + "mean_norm/layer21": 9.602255702018738, + "mean_norm/layer22": 10.143462002277374, + "mean_norm/layer23": 10.111734688282013, + "mean_norm/layer3": 9.735645592212677, + "mean_norm/layer4": 9.147038757801056, + "mean_norm/layer5": 10.40328711271286, + "mean_norm/layer6": 8.878861129283905, + "mean_norm/layer7": 9.169294118881226, + "mean_norm/layer8": 9.430241107940674, + "mean_norm/layer9": 9.397279500961304, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 4200 + }, + { + "epoch": 1.75, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.45517820420778526, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.786865711212158, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5849, + "eval_samples_per_second": 20.803, + "eval_steps_per_second": 0.691, + "step": 4200 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.77, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8143, + "max_norm": 20.623327255249023, + "max_norm/layer0": 17.0467529296875, + "max_norm/layer1": 17.657014846801758, + "max_norm/layer10": 19.062538146972656, + "max_norm/layer11": 17.97028923034668, + "max_norm/layer12": 18.820533752441406, + "max_norm/layer13": 16.673133850097656, + "max_norm/layer14": 18.132125854492188, + "max_norm/layer15": 19.867862701416016, + "max_norm/layer16": 17.479171752929688, + "max_norm/layer17": 19.690410614013672, + "max_norm/layer18": 17.983844757080078, + "max_norm/layer19": 17.591114044189453, + "max_norm/layer2": 14.908049583435059, + "max_norm/layer20": 18.829238891601562, + "max_norm/layer21": 18.25043487548828, + "max_norm/layer22": 18.438114166259766, + "max_norm/layer23": 18.365001678466797, + "max_norm/layer3": 17.014738082885742, + "max_norm/layer4": 17.379840850830078, + "max_norm/layer5": 20.623327255249023, + "max_norm/layer6": 16.337890625, + "max_norm/layer7": 18.422710418701172, + "max_norm/layer8": 18.845876693725586, + "max_norm/layer9": 18.491403579711914, + "mean_norm": 9.534027844667435, + "mean_norm/layer0": 9.091397941112518, + "mean_norm/layer1": 9.155806422233582, + "mean_norm/layer10": 9.462554395198822, + "mean_norm/layer11": 9.631404340267181, + "mean_norm/layer12": 9.874627470970154, + "mean_norm/layer13": 9.417701601982117, + "mean_norm/layer14": 9.662891149520874, + "mean_norm/layer15": 9.829482555389404, + "mean_norm/layer16": 9.484811902046204, + "mean_norm/layer17": 9.801213920116425, + "mean_norm/layer18": 9.546473264694214, + "mean_norm/layer19": 9.563193321228027, + "mean_norm/layer2": 8.493122577667236, + "mean_norm/layer20": 9.660223424434662, + "mean_norm/layer21": 9.61464524269104, + "mean_norm/layer22": 10.160698652267456, + "mean_norm/layer23": 10.12846302986145, + "mean_norm/layer3": 9.748984336853027, + "mean_norm/layer4": 9.155107080936432, + "mean_norm/layer5": 10.422005653381348, + "mean_norm/layer6": 8.88517153263092, + "mean_norm/layer7": 9.177704691886902, + "mean_norm/layer8": 9.441220581531525, + "mean_norm/layer9": 9.407763183116913, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 4250 + }, + { + "epoch": 1.77, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.45527960639726134, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7823808193206787, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8168, + "eval_samples_per_second": 20.395, + "eval_steps_per_second": 0.677, + "step": 4250 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.8, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.801, + "max_norm": 20.759300231933594, + "max_norm/layer0": 17.134748458862305, + "max_norm/layer1": 17.7257137298584, + "max_norm/layer10": 19.151565551757812, + "max_norm/layer11": 18.056488037109375, + "max_norm/layer12": 18.92339324951172, + "max_norm/layer13": 16.7547664642334, + "max_norm/layer14": 18.19631004333496, + "max_norm/layer15": 19.982650756835938, + "max_norm/layer16": 17.59579849243164, + "max_norm/layer17": 19.820369720458984, + "max_norm/layer18": 18.083040237426758, + "max_norm/layer19": 17.67841911315918, + "max_norm/layer2": 14.976433753967285, + "max_norm/layer20": 18.92435646057129, + "max_norm/layer21": 18.350635528564453, + "max_norm/layer22": 18.53485679626465, + "max_norm/layer23": 18.46183967590332, + "max_norm/layer3": 17.098966598510742, + "max_norm/layer4": 17.442232131958008, + "max_norm/layer5": 20.759300231933594, + "max_norm/layer6": 16.3858699798584, + "max_norm/layer7": 18.518962860107422, + "max_norm/layer8": 18.962594985961914, + "max_norm/layer9": 18.582992553710938, + "mean_norm": 9.545886618395647, + "mean_norm/layer0": 9.101129949092865, + "mean_norm/layer1": 9.165426433086395, + "mean_norm/layer10": 9.47351598739624, + "mean_norm/layer11": 9.643661797046661, + "mean_norm/layer12": 9.889671385288239, + "mean_norm/layer13": 9.428849935531616, + "mean_norm/layer14": 9.675801992416382, + "mean_norm/layer15": 9.84381878376007, + "mean_norm/layer16": 9.496441066265106, + "mean_norm/layer17": 9.815237402915955, + "mean_norm/layer18": 9.558767795562744, + "mean_norm/layer19": 9.57570618391037, + "mean_norm/layer2": 8.496287822723389, + "mean_norm/layer20": 9.672922849655151, + "mean_norm/layer21": 9.62732309103012, + "mean_norm/layer22": 10.17811006307602, + "mean_norm/layer23": 10.145203053951263, + "mean_norm/layer3": 9.76219356060028, + "mean_norm/layer4": 9.163109600543976, + "mean_norm/layer5": 10.44065660238266, + "mean_norm/layer6": 8.89125519990921, + "mean_norm/layer7": 9.186071753501892, + "mean_norm/layer8": 9.452130377292633, + "mean_norm/layer9": 9.417986154556274, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 4300 + }, + { + "epoch": 1.8, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.45536884032400027, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.780466318130493, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5429, + "eval_samples_per_second": 20.879, + "eval_steps_per_second": 0.693, + "step": 4300 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.82, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8073, + "max_norm": 20.906658172607422, + "max_norm/layer0": 17.20047378540039, + "max_norm/layer1": 17.7962703704834, + "max_norm/layer10": 19.260923385620117, + "max_norm/layer11": 18.1672306060791, + "max_norm/layer12": 19.01469612121582, + "max_norm/layer13": 16.84528923034668, + "max_norm/layer14": 18.279903411865234, + "max_norm/layer15": 20.088977813720703, + "max_norm/layer16": 17.689979553222656, + "max_norm/layer17": 19.94285774230957, + "max_norm/layer18": 18.162460327148438, + "max_norm/layer19": 17.780181884765625, + "max_norm/layer2": 15.040743827819824, + "max_norm/layer20": 19.01894187927246, + "max_norm/layer21": 18.461332321166992, + "max_norm/layer22": 18.63921546936035, + "max_norm/layer23": 18.553007125854492, + "max_norm/layer3": 17.176898956298828, + "max_norm/layer4": 17.507030487060547, + "max_norm/layer5": 20.906658172607422, + "max_norm/layer6": 16.445636749267578, + "max_norm/layer7": 18.60109519958496, + "max_norm/layer8": 19.051607131958008, + "max_norm/layer9": 18.66645622253418, + "mean_norm": 9.557600170373917, + "mean_norm/layer0": 9.110860824584961, + "mean_norm/layer1": 9.175042450428009, + "mean_norm/layer10": 9.484363615512848, + "mean_norm/layer11": 9.655846178531647, + "mean_norm/layer12": 9.904585361480713, + "mean_norm/layer13": 9.43986588716507, + "mean_norm/layer14": 9.688460767269135, + "mean_norm/layer15": 9.85785061120987, + "mean_norm/layer16": 9.508097112178802, + "mean_norm/layer17": 9.829115748405457, + "mean_norm/layer18": 9.570830702781677, + "mean_norm/layer19": 9.58799260854721, + "mean_norm/layer2": 8.499535202980042, + "mean_norm/layer20": 9.685294151306152, + "mean_norm/layer21": 9.63974541425705, + "mean_norm/layer22": 10.195148229598999, + "mean_norm/layer23": 10.16170072555542, + "mean_norm/layer3": 9.775292813777924, + "mean_norm/layer4": 9.170989692211151, + "mean_norm/layer5": 10.459139466285706, + "mean_norm/layer6": 8.897323548793793, + "mean_norm/layer7": 9.194344580173492, + "mean_norm/layer8": 9.462877452373505, + "mean_norm/layer9": 9.428100943565369, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 4350 + }, + { + "epoch": 1.82, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.45615572131433463, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7751033306121826, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8372, + "eval_samples_per_second": 20.359, + "eval_steps_per_second": 0.676, + "step": 4350 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.84, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.7988, + "max_norm": 21.04453468322754, + "max_norm/layer0": 17.255943298339844, + "max_norm/layer1": 17.868118286132812, + "max_norm/layer10": 19.348005294799805, + "max_norm/layer11": 18.268312454223633, + "max_norm/layer12": 19.103347778320312, + "max_norm/layer13": 16.914888381958008, + "max_norm/layer14": 18.352100372314453, + "max_norm/layer15": 20.2009334564209, + "max_norm/layer16": 17.780242919921875, + "max_norm/layer17": 20.08079719543457, + "max_norm/layer18": 18.235071182250977, + "max_norm/layer19": 17.867902755737305, + "max_norm/layer2": 15.10726261138916, + "max_norm/layer20": 19.109235763549805, + "max_norm/layer21": 18.55447769165039, + "max_norm/layer22": 18.748037338256836, + "max_norm/layer23": 18.645830154418945, + "max_norm/layer3": 17.249866485595703, + "max_norm/layer4": 17.581409454345703, + "max_norm/layer5": 21.04453468322754, + "max_norm/layer6": 16.516193389892578, + "max_norm/layer7": 18.686376571655273, + "max_norm/layer8": 19.148639678955078, + "max_norm/layer9": 18.74429702758789, + "mean_norm": 9.569357293347517, + "mean_norm/layer0": 9.120525360107422, + "mean_norm/layer1": 9.184691786766052, + "mean_norm/layer10": 9.495336592197418, + "mean_norm/layer11": 9.668105900287628, + "mean_norm/layer12": 9.919475436210632, + "mean_norm/layer13": 9.45104306936264, + "mean_norm/layer14": 9.70114290714264, + "mean_norm/layer15": 9.872009038925171, + "mean_norm/layer16": 9.519804000854492, + "mean_norm/layer17": 9.842991590499878, + "mean_norm/layer18": 9.58296275138855, + "mean_norm/layer19": 9.600463032722473, + "mean_norm/layer2": 8.502758204936981, + "mean_norm/layer20": 9.69754272699356, + "mean_norm/layer21": 9.652194738388062, + "mean_norm/layer22": 10.212375521659851, + "mean_norm/layer23": 10.178341031074524, + "mean_norm/layer3": 9.788307666778564, + "mean_norm/layer4": 9.179190576076508, + "mean_norm/layer5": 10.477513015270233, + "mean_norm/layer6": 8.903360545635223, + "mean_norm/layer7": 9.202587485313416, + "mean_norm/layer8": 9.473590970039368, + "mean_norm/layer9": 9.438261091709137, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 4400 + }, + { + "epoch": 1.84, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.45590424388443396, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.775115489959717, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5853, + "eval_samples_per_second": 20.802, + "eval_steps_per_second": 0.691, + "step": 4400 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.86, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.7915, + "max_norm": 21.17486572265625, + "max_norm/layer0": 17.298419952392578, + "max_norm/layer1": 17.930343627929688, + "max_norm/layer10": 19.43759536743164, + "max_norm/layer11": 18.360822677612305, + "max_norm/layer12": 19.205596923828125, + "max_norm/layer13": 17.017274856567383, + "max_norm/layer14": 18.43059730529785, + "max_norm/layer15": 20.340652465820312, + "max_norm/layer16": 17.854707717895508, + "max_norm/layer17": 20.208559036254883, + "max_norm/layer18": 18.296897888183594, + "max_norm/layer19": 17.949644088745117, + "max_norm/layer2": 15.163930892944336, + "max_norm/layer20": 19.194684982299805, + "max_norm/layer21": 18.658071517944336, + "max_norm/layer22": 18.858280181884766, + "max_norm/layer23": 18.766464233398438, + "max_norm/layer3": 17.32754898071289, + "max_norm/layer4": 17.661903381347656, + "max_norm/layer5": 21.17486572265625, + "max_norm/layer6": 16.588512420654297, + "max_norm/layer7": 18.78378677368164, + "max_norm/layer8": 19.22671890258789, + "max_norm/layer9": 18.828065872192383, + "mean_norm": 9.58110864708821, + "mean_norm/layer0": 9.13014280796051, + "mean_norm/layer1": 9.19428437948227, + "mean_norm/layer10": 9.506189048290253, + "mean_norm/layer11": 9.68019586801529, + "mean_norm/layer12": 9.93433165550232, + "mean_norm/layer13": 9.462150931358337, + "mean_norm/layer14": 9.713736414909363, + "mean_norm/layer15": 9.886185884475708, + "mean_norm/layer16": 9.531567752361298, + "mean_norm/layer17": 9.856738686561584, + "mean_norm/layer18": 9.595190525054932, + "mean_norm/layer19": 9.612755954265594, + "mean_norm/layer2": 8.505994141101837, + "mean_norm/layer20": 9.709813356399536, + "mean_norm/layer21": 9.664562940597534, + "mean_norm/layer22": 10.22979611158371, + "mean_norm/layer23": 10.195049226284027, + "mean_norm/layer3": 9.801417529582977, + "mean_norm/layer4": 9.187121748924255, + "mean_norm/layer5": 10.495978653430939, + "mean_norm/layer6": 8.909496486186981, + "mean_norm/layer7": 9.211061120033264, + "mean_norm/layer8": 9.48429411649704, + "mean_norm/layer9": 9.448552191257477, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 4450 + }, + { + "epoch": 1.86, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.45618005783980886, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7739932537078857, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8201, + "eval_samples_per_second": 20.389, + "eval_steps_per_second": 0.677, + "step": 4450 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.88, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.8088, + "max_norm": 21.288240432739258, + "max_norm/layer0": 17.345314025878906, + "max_norm/layer1": 18.00452423095703, + "max_norm/layer10": 19.536436080932617, + "max_norm/layer11": 18.446500778198242, + "max_norm/layer12": 19.339845657348633, + "max_norm/layer13": 17.11781120300293, + "max_norm/layer14": 18.51311683654785, + "max_norm/layer15": 20.480234146118164, + "max_norm/layer16": 17.940902709960938, + "max_norm/layer17": 20.350200653076172, + "max_norm/layer18": 18.398128509521484, + "max_norm/layer19": 18.029136657714844, + "max_norm/layer2": 15.231613159179688, + "max_norm/layer20": 19.287769317626953, + "max_norm/layer21": 18.776599884033203, + "max_norm/layer22": 18.979724884033203, + "max_norm/layer23": 18.858877182006836, + "max_norm/layer3": 17.388498306274414, + "max_norm/layer4": 17.775165557861328, + "max_norm/layer5": 21.288240432739258, + "max_norm/layer6": 16.653141021728516, + "max_norm/layer7": 18.898910522460938, + "max_norm/layer8": 19.32200050354004, + "max_norm/layer9": 18.906003952026367, + "mean_norm": 9.592867535849413, + "mean_norm/layer0": 9.139825999736786, + "mean_norm/layer1": 9.20407783985138, + "mean_norm/layer10": 9.517067611217499, + "mean_norm/layer11": 9.692343294620514, + "mean_norm/layer12": 9.94935166835785, + "mean_norm/layer13": 9.473208963871002, + "mean_norm/layer14": 9.726474404335022, + "mean_norm/layer15": 9.900470495223999, + "mean_norm/layer16": 9.54332023859024, + "mean_norm/layer17": 9.870534479618073, + "mean_norm/layer18": 9.60720431804657, + "mean_norm/layer19": 9.625152111053467, + "mean_norm/layer2": 8.509223759174347, + "mean_norm/layer20": 9.722173869609833, + "mean_norm/layer21": 9.67687976360321, + "mean_norm/layer22": 10.246850192546844, + "mean_norm/layer23": 10.211505055427551, + "mean_norm/layer3": 9.814597129821777, + "mean_norm/layer4": 9.194973826408386, + "mean_norm/layer5": 10.514500916004181, + "mean_norm/layer6": 8.915790915489197, + "mean_norm/layer7": 9.219484984874725, + "mean_norm/layer8": 9.49491000175476, + "mean_norm/layer9": 9.458899021148682, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 4500 + }, + { + "epoch": 1.88, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.456188170014967, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7761588096618652, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8106, + "eval_samples_per_second": 20.405, + "eval_steps_per_second": 0.677, + "step": 4500 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.9, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.7959, + "max_norm": 21.412240982055664, + "max_norm/layer0": 17.401063919067383, + "max_norm/layer1": 18.084028244018555, + "max_norm/layer10": 19.634403228759766, + "max_norm/layer11": 18.531543731689453, + "max_norm/layer12": 19.471622467041016, + "max_norm/layer13": 17.196971893310547, + "max_norm/layer14": 18.595664978027344, + "max_norm/layer15": 20.628389358520508, + "max_norm/layer16": 18.04037857055664, + "max_norm/layer17": 20.481491088867188, + "max_norm/layer18": 18.486473083496094, + "max_norm/layer19": 18.102190017700195, + "max_norm/layer2": 15.300971031188965, + "max_norm/layer20": 19.38399887084961, + "max_norm/layer21": 18.876100540161133, + "max_norm/layer22": 19.10553550720215, + "max_norm/layer23": 18.965547561645508, + "max_norm/layer3": 17.45551872253418, + "max_norm/layer4": 17.88532066345215, + "max_norm/layer5": 21.412240982055664, + "max_norm/layer6": 16.702308654785156, + "max_norm/layer7": 19.0312442779541, + "max_norm/layer8": 19.416467666625977, + "max_norm/layer9": 19.000038146972656, + "mean_norm": 9.60454748570919, + "mean_norm/layer0": 9.149442195892334, + "mean_norm/layer1": 9.213627398014069, + "mean_norm/layer10": 9.527814865112305, + "mean_norm/layer11": 9.704487025737762, + "mean_norm/layer12": 9.964283287525177, + "mean_norm/layer13": 9.484197497367859, + "mean_norm/layer14": 9.73909717798233, + "mean_norm/layer15": 9.914574265480042, + "mean_norm/layer16": 9.55492353439331, + "mean_norm/layer17": 9.884373843669891, + "mean_norm/layer18": 9.619216859340668, + "mean_norm/layer19": 9.637514412403107, + "mean_norm/layer2": 8.512493133544922, + "mean_norm/layer20": 9.734349429607391, + "mean_norm/layer21": 9.689200222492218, + "mean_norm/layer22": 10.263882875442505, + "mean_norm/layer23": 10.227949321269989, + "mean_norm/layer3": 9.827821612358093, + "mean_norm/layer4": 9.202875196933746, + "mean_norm/layer5": 10.532879412174225, + "mean_norm/layer6": 8.921751141548157, + "mean_norm/layer7": 9.227769911289215, + "mean_norm/layer8": 9.505604028701782, + "mean_norm/layer9": 9.469011008739471, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 4550 + }, + { + "epoch": 1.9, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4568898731661414, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.768836259841919, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5533, + "eval_samples_per_second": 20.86, + "eval_steps_per_second": 0.692, + "step": 4550 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.92, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.7942, + "max_norm": 21.53392791748047, + "max_norm/layer0": 17.465423583984375, + "max_norm/layer1": 18.17967414855957, + "max_norm/layer10": 19.711856842041016, + "max_norm/layer11": 18.609466552734375, + "max_norm/layer12": 19.569843292236328, + "max_norm/layer13": 17.279605865478516, + "max_norm/layer14": 18.686342239379883, + "max_norm/layer15": 20.776939392089844, + "max_norm/layer16": 18.130950927734375, + "max_norm/layer17": 20.6143741607666, + "max_norm/layer18": 18.57437515258789, + "max_norm/layer19": 18.213754653930664, + "max_norm/layer2": 15.358172416687012, + "max_norm/layer20": 19.491958618164062, + "max_norm/layer21": 18.976621627807617, + "max_norm/layer22": 19.238208770751953, + "max_norm/layer23": 19.04021644592285, + "max_norm/layer3": 17.52911376953125, + "max_norm/layer4": 17.98028564453125, + "max_norm/layer5": 21.53392791748047, + "max_norm/layer6": 16.75553321838379, + "max_norm/layer7": 19.121355056762695, + "max_norm/layer8": 19.50104522705078, + "max_norm/layer9": 19.088035583496094, + "mean_norm": 9.616017671922842, + "mean_norm/layer0": 9.158940315246582, + "mean_norm/layer1": 9.223099112510681, + "mean_norm/layer10": 9.538458824157715, + "mean_norm/layer11": 9.716457784175873, + "mean_norm/layer12": 9.978936910629272, + "mean_norm/layer13": 9.49501234292984, + "mean_norm/layer14": 9.751602709293365, + "mean_norm/layer15": 9.92855703830719, + "mean_norm/layer16": 9.566272795200348, + "mean_norm/layer17": 9.897848546504974, + "mean_norm/layer18": 9.630900084972382, + "mean_norm/layer19": 9.649376332759857, + "mean_norm/layer2": 8.51567929983139, + "mean_norm/layer20": 9.746204793453217, + "mean_norm/layer21": 9.70108163356781, + "mean_norm/layer22": 10.280311226844788, + "mean_norm/layer23": 10.244093477725983, + "mean_norm/layer3": 9.840932130813599, + "mean_norm/layer4": 9.21077847480774, + "mean_norm/layer5": 10.55105346441269, + "mean_norm/layer6": 8.927722990512848, + "mean_norm/layer7": 9.2358558177948, + "mean_norm/layer8": 9.51610243320465, + "mean_norm/layer9": 9.479145586490631, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 4600 + }, + { + "epoch": 1.92, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.45723058452278104, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7702465057373047, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8086, + "eval_samples_per_second": 20.409, + "eval_steps_per_second": 0.677, + "step": 4600 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.94, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.7986, + "max_norm": 21.668651580810547, + "max_norm/layer0": 17.538354873657227, + "max_norm/layer1": 18.273357391357422, + "max_norm/layer10": 19.79624366760254, + "max_norm/layer11": 18.679546356201172, + "max_norm/layer12": 19.675004959106445, + "max_norm/layer13": 17.357282638549805, + "max_norm/layer14": 18.773691177368164, + "max_norm/layer15": 20.872743606567383, + "max_norm/layer16": 18.211257934570312, + "max_norm/layer17": 20.737648010253906, + "max_norm/layer18": 18.65184211730957, + "max_norm/layer19": 18.335451126098633, + "max_norm/layer2": 15.420967102050781, + "max_norm/layer20": 19.6021728515625, + "max_norm/layer21": 19.084949493408203, + "max_norm/layer22": 19.35108184814453, + "max_norm/layer23": 19.116403579711914, + "max_norm/layer3": 17.621381759643555, + "max_norm/layer4": 18.06914710998535, + "max_norm/layer5": 21.668651580810547, + "max_norm/layer6": 16.80304718017578, + "max_norm/layer7": 19.21202850341797, + "max_norm/layer8": 19.5865421295166, + "max_norm/layer9": 19.177453994750977, + "mean_norm": 9.62727957467238, + "mean_norm/layer0": 9.16827380657196, + "mean_norm/layer1": 9.232361853122711, + "mean_norm/layer10": 9.549022853374481, + "mean_norm/layer11": 9.728195488452911, + "mean_norm/layer12": 9.993273079395294, + "mean_norm/layer13": 9.505652070045471, + "mean_norm/layer14": 9.763936638832092, + "mean_norm/layer15": 9.942192792892456, + "mean_norm/layer16": 9.577354550361633, + "mean_norm/layer17": 9.911025285720825, + "mean_norm/layer18": 9.642389118671417, + "mean_norm/layer19": 9.660954356193542, + "mean_norm/layer2": 8.51875525712967, + "mean_norm/layer20": 9.758077919483185, + "mean_norm/layer21": 9.712872505187988, + "mean_norm/layer22": 10.296362459659576, + "mean_norm/layer23": 10.259945154190063, + "mean_norm/layer3": 9.853806853294373, + "mean_norm/layer4": 9.218483328819275, + "mean_norm/layer5": 10.56893503665924, + "mean_norm/layer6": 8.933514535427094, + "mean_norm/layer7": 9.243833124637604, + "mean_norm/layer8": 9.526439189910889, + "mean_norm/layer9": 9.489052534103394, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 4650 + }, + { + "epoch": 1.94, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.45738065976320563, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7653119564056396, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8081, + "eval_samples_per_second": 20.41, + "eval_steps_per_second": 0.678, + "step": 4650 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.96, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.7875, + "max_norm": 21.812347412109375, + "max_norm/layer0": 17.620792388916016, + "max_norm/layer1": 18.36002540588379, + "max_norm/layer10": 19.895370483398438, + "max_norm/layer11": 18.755598068237305, + "max_norm/layer12": 19.789051055908203, + "max_norm/layer13": 17.464237213134766, + "max_norm/layer14": 18.870973587036133, + "max_norm/layer15": 20.999399185180664, + "max_norm/layer16": 18.288803100585938, + "max_norm/layer17": 20.858943939208984, + "max_norm/layer18": 18.758024215698242, + "max_norm/layer19": 18.439855575561523, + "max_norm/layer2": 15.474851608276367, + "max_norm/layer20": 19.70724868774414, + "max_norm/layer21": 19.183589935302734, + "max_norm/layer22": 19.45682716369629, + "max_norm/layer23": 19.219196319580078, + "max_norm/layer3": 17.702922821044922, + "max_norm/layer4": 18.186697006225586, + "max_norm/layer5": 21.812347412109375, + "max_norm/layer6": 16.868118286132812, + "max_norm/layer7": 19.29692268371582, + "max_norm/layer8": 19.681978225708008, + "max_norm/layer9": 19.25440788269043, + "mean_norm": 9.638825024167696, + "mean_norm/layer0": 9.17789477109909, + "mean_norm/layer1": 9.24189579486847, + "mean_norm/layer10": 9.559810936450958, + "mean_norm/layer11": 9.74020391702652, + "mean_norm/layer12": 10.008057594299316, + "mean_norm/layer13": 9.51668530702591, + "mean_norm/layer14": 9.776471257209778, + "mean_norm/layer15": 9.956155121326447, + "mean_norm/layer16": 9.58882337808609, + "mean_norm/layer17": 9.924677908420563, + "mean_norm/layer18": 9.654309391975403, + "mean_norm/layer19": 9.672747313976288, + "mean_norm/layer2": 8.521749794483185, + "mean_norm/layer20": 9.769956290721893, + "mean_norm/layer21": 9.724786639213562, + "mean_norm/layer22": 10.312981486320496, + "mean_norm/layer23": 10.276334583759308, + "mean_norm/layer3": 9.866843819618225, + "mean_norm/layer4": 9.22641772031784, + "mean_norm/layer5": 10.587312281131744, + "mean_norm/layer6": 8.939548313617706, + "mean_norm/layer7": 9.252090871334076, + "mean_norm/layer8": 9.536978244781494, + "mean_norm/layer9": 9.499067842960358, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 4700 + }, + { + "epoch": 1.96, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.45789578288574406, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7666313648223877, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6039, + "eval_samples_per_second": 20.769, + "eval_steps_per_second": 0.689, + "step": 4700 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 1.98, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.7972, + "max_norm": 21.965734481811523, + "max_norm/layer0": 17.689268112182617, + "max_norm/layer1": 18.430795669555664, + "max_norm/layer10": 19.9880428314209, + "max_norm/layer11": 18.836973190307617, + "max_norm/layer12": 19.878585815429688, + "max_norm/layer13": 17.54067039489746, + "max_norm/layer14": 18.96476173400879, + "max_norm/layer15": 21.133108139038086, + "max_norm/layer16": 18.367586135864258, + "max_norm/layer17": 20.977399826049805, + "max_norm/layer18": 18.857200622558594, + "max_norm/layer19": 18.525466918945312, + "max_norm/layer2": 15.54166316986084, + "max_norm/layer20": 19.816164016723633, + "max_norm/layer21": 19.26383399963379, + "max_norm/layer22": 19.56534194946289, + "max_norm/layer23": 19.31981086730957, + "max_norm/layer3": 17.79178810119629, + "max_norm/layer4": 18.29109764099121, + "max_norm/layer5": 21.965734481811523, + "max_norm/layer6": 16.933610916137695, + "max_norm/layer7": 19.38679313659668, + "max_norm/layer8": 19.795856475830078, + "max_norm/layer9": 19.338916778564453, + "mean_norm": 9.650136108199755, + "mean_norm/layer0": 9.18730765581131, + "mean_norm/layer1": 9.251254618167877, + "mean_norm/layer10": 9.570415079593658, + "mean_norm/layer11": 9.752062618732452, + "mean_norm/layer12": 10.022457659244537, + "mean_norm/layer13": 9.527392983436584, + "mean_norm/layer14": 9.788740396499634, + "mean_norm/layer15": 9.969760477542877, + "mean_norm/layer16": 9.600076735019684, + "mean_norm/layer17": 9.938059866428375, + "mean_norm/layer18": 9.66584461927414, + "mean_norm/layer19": 9.68437534570694, + "mean_norm/layer2": 8.524769961833954, + "mean_norm/layer20": 9.78183799982071, + "mean_norm/layer21": 9.736468076705933, + "mean_norm/layer22": 10.328970611095428, + "mean_norm/layer23": 10.292193472385406, + "mean_norm/layer3": 9.879729330539703, + "mean_norm/layer4": 9.234225153923035, + "mean_norm/layer5": 10.605308294296265, + "mean_norm/layer6": 8.945447742938995, + "mean_norm/layer7": 9.260186851024628, + "mean_norm/layer8": 9.547355473041534, + "mean_norm/layer9": 9.509025573730469, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 4750 + }, + { + "epoch": 1.98, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4573968841135218, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7658636569976807, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5352, + "eval_samples_per_second": 20.893, + "eval_steps_per_second": 0.694, + "step": 4750 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.0, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.7549, + "max_norm": 22.097200393676758, + "max_norm/layer0": 17.7503719329834, + "max_norm/layer1": 18.497804641723633, + "max_norm/layer10": 20.086458206176758, + "max_norm/layer11": 18.916461944580078, + "max_norm/layer12": 19.985445022583008, + "max_norm/layer13": 17.607402801513672, + "max_norm/layer14": 19.063182830810547, + "max_norm/layer15": 21.26007080078125, + "max_norm/layer16": 18.455631256103516, + "max_norm/layer17": 21.091989517211914, + "max_norm/layer18": 18.967914581298828, + "max_norm/layer19": 18.608983993530273, + "max_norm/layer2": 15.61719036102295, + "max_norm/layer20": 19.923967361450195, + "max_norm/layer21": 19.351205825805664, + "max_norm/layer22": 19.670289993286133, + "max_norm/layer23": 19.406200408935547, + "max_norm/layer3": 17.88211441040039, + "max_norm/layer4": 18.38958168029785, + "max_norm/layer5": 22.097200393676758, + "max_norm/layer6": 16.993507385253906, + "max_norm/layer7": 19.465435028076172, + "max_norm/layer8": 19.875547409057617, + "max_norm/layer9": 19.429819107055664, + "mean_norm": 9.661303776005903, + "mean_norm/layer0": 9.196622729301453, + "mean_norm/layer1": 9.260469496250153, + "mean_norm/layer10": 9.580876767635345, + "mean_norm/layer11": 9.763825356960297, + "mean_norm/layer12": 10.036564350128174, + "mean_norm/layer13": 9.537844955921173, + "mean_norm/layer14": 9.800962150096893, + "mean_norm/layer15": 9.983208060264587, + "mean_norm/layer16": 9.61099511384964, + "mean_norm/layer17": 9.951125979423523, + "mean_norm/layer18": 9.677132070064545, + "mean_norm/layer19": 9.695655643939972, + "mean_norm/layer2": 8.52772867679596, + "mean_norm/layer20": 9.793645083904266, + "mean_norm/layer21": 9.748089730739594, + "mean_norm/layer22": 10.345001339912415, + "mean_norm/layer23": 10.307753026485443, + "mean_norm/layer3": 9.892489731311798, + "mean_norm/layer4": 9.24187582731247, + "mean_norm/layer5": 10.623258709907532, + "mean_norm/layer6": 8.951395571231842, + "mean_norm/layer7": 9.2682363986969, + "mean_norm/layer8": 9.557595670223236, + "mean_norm/layer9": 9.518938183784485, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 4800 + }, + { + "epoch": 2.0, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4563869183063401, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.770103693008423, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7952, + "eval_samples_per_second": 20.432, + "eval_steps_per_second": 0.678, + "step": 4800 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.03, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6161, + "max_norm": 22.229122161865234, + "max_norm/layer0": 17.81972312927246, + "max_norm/layer1": 18.582639694213867, + "max_norm/layer10": 20.194303512573242, + "max_norm/layer11": 18.99195671081543, + "max_norm/layer12": 20.07562828063965, + "max_norm/layer13": 17.683574676513672, + "max_norm/layer14": 19.15118408203125, + "max_norm/layer15": 21.398839950561523, + "max_norm/layer16": 18.56853485107422, + "max_norm/layer17": 21.212589263916016, + "max_norm/layer18": 19.053190231323242, + "max_norm/layer19": 18.710668563842773, + "max_norm/layer2": 15.681137084960938, + "max_norm/layer20": 20.02528190612793, + "max_norm/layer21": 19.46278190612793, + "max_norm/layer22": 19.791105270385742, + "max_norm/layer23": 19.512958526611328, + "max_norm/layer3": 17.977426528930664, + "max_norm/layer4": 18.481155395507812, + "max_norm/layer5": 22.229122161865234, + "max_norm/layer6": 17.07346534729004, + "max_norm/layer7": 19.551734924316406, + "max_norm/layer8": 19.978107452392578, + "max_norm/layer9": 19.52581024169922, + "mean_norm": 9.67351096123457, + "mean_norm/layer0": 9.206518650054932, + "mean_norm/layer1": 9.270343840122223, + "mean_norm/layer10": 9.592012703418732, + "mean_norm/layer11": 9.776739001274109, + "mean_norm/layer12": 10.052140772342682, + "mean_norm/layer13": 9.54944109916687, + "mean_norm/layer14": 9.814337015151978, + "mean_norm/layer15": 9.998102486133575, + "mean_norm/layer16": 9.623249113559723, + "mean_norm/layer17": 9.965643167495728, + "mean_norm/layer18": 9.68981283903122, + "mean_norm/layer19": 9.708701848983765, + "mean_norm/layer2": 8.53110545873642, + "mean_norm/layer20": 9.807106733322144, + "mean_norm/layer21": 9.761286437511444, + "mean_norm/layer22": 10.362047135829926, + "mean_norm/layer23": 10.32488340139389, + "mean_norm/layer3": 9.906088292598724, + "mean_norm/layer4": 9.250157296657562, + "mean_norm/layer5": 10.641968488693237, + "mean_norm/layer6": 8.957864344120026, + "mean_norm/layer7": 9.276767492294312, + "mean_norm/layer8": 9.56849718093872, + "mean_norm/layer9": 9.52944827079773, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 4850 + }, + { + "epoch": 2.03, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4569547705674061, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7753307819366455, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5422, + "eval_samples_per_second": 20.88, + "eval_steps_per_second": 0.693, + "step": 4850 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.05, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6189, + "max_norm": 22.367904663085938, + "max_norm/layer0": 17.887420654296875, + "max_norm/layer1": 18.671733856201172, + "max_norm/layer10": 20.304906845092773, + "max_norm/layer11": 19.061819076538086, + "max_norm/layer12": 20.177019119262695, + "max_norm/layer13": 17.76485252380371, + "max_norm/layer14": 19.243499755859375, + "max_norm/layer15": 21.52268409729004, + "max_norm/layer16": 18.677610397338867, + "max_norm/layer17": 21.335845947265625, + "max_norm/layer18": 19.159006118774414, + "max_norm/layer19": 18.810163497924805, + "max_norm/layer2": 15.746746063232422, + "max_norm/layer20": 20.1280517578125, + "max_norm/layer21": 19.575899124145508, + "max_norm/layer22": 19.892805099487305, + "max_norm/layer23": 19.60469627380371, + "max_norm/layer3": 18.071157455444336, + "max_norm/layer4": 18.57114601135254, + "max_norm/layer5": 22.367904663085938, + "max_norm/layer6": 17.15428924560547, + "max_norm/layer7": 19.633804321289062, + "max_norm/layer8": 20.081315994262695, + "max_norm/layer9": 19.6232967376709, + "mean_norm": 9.685750077168146, + "mean_norm/layer0": 9.217075943946838, + "mean_norm/layer1": 9.280148386955261, + "mean_norm/layer10": 9.603125274181366, + "mean_norm/layer11": 9.789462864398956, + "mean_norm/layer12": 10.067663490772247, + "mean_norm/layer13": 9.561099231243134, + "mean_norm/layer14": 9.827849328517914, + "mean_norm/layer15": 10.012909770011902, + "mean_norm/layer16": 9.635309100151062, + "mean_norm/layer17": 9.979934573173523, + "mean_norm/layer18": 9.702326834201813, + "mean_norm/layer19": 9.721765398979187, + "mean_norm/layer2": 8.534556448459625, + "mean_norm/layer20": 9.820671617984772, + "mean_norm/layer21": 9.774718105793, + "mean_norm/layer22": 10.379175782203674, + "mean_norm/layer23": 10.342072427272797, + "mean_norm/layer3": 9.919848799705505, + "mean_norm/layer4": 9.25857150554657, + "mean_norm/layer5": 10.660731792449951, + "mean_norm/layer6": 8.964467108249664, + "mean_norm/layer7": 9.285303235054016, + "mean_norm/layer8": 9.579225778579712, + "mean_norm/layer9": 9.539989054203033, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 4900 + }, + { + "epoch": 2.05, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.45636663786844484, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.778195858001709, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5841, + "eval_samples_per_second": 20.804, + "eval_steps_per_second": 0.691, + "step": 4900 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.07, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6266, + "max_norm": 22.497936248779297, + "max_norm/layer0": 17.95612144470215, + "max_norm/layer1": 18.766647338867188, + "max_norm/layer10": 20.393529891967773, + "max_norm/layer11": 19.140981674194336, + "max_norm/layer12": 20.30097198486328, + "max_norm/layer13": 17.845705032348633, + "max_norm/layer14": 19.33021354675293, + "max_norm/layer15": 21.635671615600586, + "max_norm/layer16": 18.780454635620117, + "max_norm/layer17": 21.467220306396484, + "max_norm/layer18": 19.249921798706055, + "max_norm/layer19": 18.916114807128906, + "max_norm/layer2": 15.8043794631958, + "max_norm/layer20": 20.2207088470459, + "max_norm/layer21": 19.68240737915039, + "max_norm/layer22": 20.003076553344727, + "max_norm/layer23": 19.702362060546875, + "max_norm/layer3": 18.159029006958008, + "max_norm/layer4": 18.67041015625, + "max_norm/layer5": 22.497936248779297, + "max_norm/layer6": 17.22257423400879, + "max_norm/layer7": 19.70867156982422, + "max_norm/layer8": 20.17713165283203, + "max_norm/layer9": 19.7199764251709, + "mean_norm": 9.698031273980936, + "mean_norm/layer0": 9.2280832529068, + "mean_norm/layer1": 9.29011619091034, + "mean_norm/layer10": 9.614328265190125, + "mean_norm/layer11": 9.802447438240051, + "mean_norm/layer12": 10.083309292793274, + "mean_norm/layer13": 9.572734773159027, + "mean_norm/layer14": 9.841307997703552, + "mean_norm/layer15": 10.027710676193237, + "mean_norm/layer16": 9.647395431995392, + "mean_norm/layer17": 9.994074761867523, + "mean_norm/layer18": 9.714804410934448, + "mean_norm/layer19": 9.73473072052002, + "mean_norm/layer2": 8.538142025470734, + "mean_norm/layer20": 9.833818078041077, + "mean_norm/layer21": 9.787812173366547, + "mean_norm/layer22": 10.39659869670868, + "mean_norm/layer23": 10.359000742435455, + "mean_norm/layer3": 9.933819353580475, + "mean_norm/layer4": 9.267073810100555, + "mean_norm/layer5": 10.679556548595428, + "mean_norm/layer6": 8.971089124679565, + "mean_norm/layer7": 9.293950021266937, + "mean_norm/layer8": 9.59020709991455, + "mean_norm/layer9": 9.550639688968658, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 4950 + }, + { + "epoch": 2.07, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.45755507152910446, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.778442859649658, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 10.7905, + "eval_samples_per_second": 22.334, + "eval_steps_per_second": 0.741, + "step": 4950 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.09, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6468, + "max_norm": 22.62725257873535, + "max_norm/layer0": 18.031448364257812, + "max_norm/layer1": 18.85249137878418, + "max_norm/layer10": 20.487457275390625, + "max_norm/layer11": 19.27031898498535, + "max_norm/layer12": 20.434553146362305, + "max_norm/layer13": 17.91874122619629, + "max_norm/layer14": 19.41231346130371, + "max_norm/layer15": 21.761850357055664, + "max_norm/layer16": 18.886045455932617, + "max_norm/layer17": 21.617713928222656, + "max_norm/layer18": 19.34942626953125, + "max_norm/layer19": 19.026630401611328, + "max_norm/layer2": 15.86556339263916, + "max_norm/layer20": 20.321598052978516, + "max_norm/layer21": 19.79185676574707, + "max_norm/layer22": 20.136564254760742, + "max_norm/layer23": 19.804283142089844, + "max_norm/layer3": 18.258943557739258, + "max_norm/layer4": 18.755266189575195, + "max_norm/layer5": 22.62725257873535, + "max_norm/layer6": 17.279165267944336, + "max_norm/layer7": 19.7928466796875, + "max_norm/layer8": 20.278255462646484, + "max_norm/layer9": 19.814647674560547, + "mean_norm": 9.71029263238112, + "mean_norm/layer0": 9.239352583885193, + "mean_norm/layer1": 9.300042927265167, + "mean_norm/layer10": 9.625477373600006, + "mean_norm/layer11": 9.815385699272156, + "mean_norm/layer12": 10.098966121673584, + "mean_norm/layer13": 9.584208488464355, + "mean_norm/layer14": 9.854663968086243, + "mean_norm/layer15": 10.042455911636353, + "mean_norm/layer16": 9.659296989440918, + "mean_norm/layer17": 10.008129358291626, + "mean_norm/layer18": 9.727139055728912, + "mean_norm/layer19": 9.74753886461258, + "mean_norm/layer2": 8.541776299476624, + "mean_norm/layer20": 9.846904814243317, + "mean_norm/layer21": 9.800666272640228, + "mean_norm/layer22": 10.414086759090424, + "mean_norm/layer23": 10.375837922096252, + "mean_norm/layer3": 9.947814524173737, + "mean_norm/layer4": 9.275640845298767, + "mean_norm/layer5": 10.698535740375519, + "mean_norm/layer6": 8.977764904499054, + "mean_norm/layer7": 9.302622854709625, + "mean_norm/layer8": 9.601214170455933, + "mean_norm/layer9": 9.56150072813034, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 5000 + }, + { + "epoch": 2.09, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4572954819240457, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7788991928100586, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8093, + "eval_samples_per_second": 20.408, + "eval_steps_per_second": 0.677, + "step": 5000 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.11, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6487, + "max_norm": 22.76466941833496, + "max_norm/layer0": 18.100759506225586, + "max_norm/layer1": 18.94605827331543, + "max_norm/layer10": 20.581647872924805, + "max_norm/layer11": 19.369783401489258, + "max_norm/layer12": 20.52696990966797, + "max_norm/layer13": 17.98175048828125, + "max_norm/layer14": 19.488126754760742, + "max_norm/layer15": 21.85770034790039, + "max_norm/layer16": 18.97614860534668, + "max_norm/layer17": 21.745214462280273, + "max_norm/layer18": 19.442224502563477, + "max_norm/layer19": 19.127676010131836, + "max_norm/layer2": 15.919937133789062, + "max_norm/layer20": 20.431379318237305, + "max_norm/layer21": 19.900375366210938, + "max_norm/layer22": 20.263553619384766, + "max_norm/layer23": 19.90934181213379, + "max_norm/layer3": 18.351699829101562, + "max_norm/layer4": 18.841182708740234, + "max_norm/layer5": 22.76466941833496, + "max_norm/layer6": 17.338943481445312, + "max_norm/layer7": 19.896106719970703, + "max_norm/layer8": 20.378662109375, + "max_norm/layer9": 19.90271759033203, + "mean_norm": 9.722342488666376, + "mean_norm/layer0": 9.250700294971466, + "mean_norm/layer1": 9.309888064861298, + "mean_norm/layer10": 9.63647472858429, + "mean_norm/layer11": 9.828037559986115, + "mean_norm/layer12": 10.114314317703247, + "mean_norm/layer13": 9.595680236816406, + "mean_norm/layer14": 9.86775666475296, + "mean_norm/layer15": 10.057121217250824, + "mean_norm/layer16": 9.671030879020691, + "mean_norm/layer17": 10.021993637084961, + "mean_norm/layer18": 9.739132702350616, + "mean_norm/layer19": 9.759905397891998, + "mean_norm/layer2": 8.54540067911148, + "mean_norm/layer20": 9.859400808811188, + "mean_norm/layer21": 9.81334936618805, + "mean_norm/layer22": 10.431015074253082, + "mean_norm/layer23": 10.392397820949554, + "mean_norm/layer3": 9.961604416370392, + "mean_norm/layer4": 9.284013032913208, + "mean_norm/layer5": 10.717323243618011, + "mean_norm/layer6": 8.984280347824097, + "mean_norm/layer7": 9.311186790466309, + "mean_norm/layer8": 9.612077295780182, + "mean_norm/layer9": 9.572135150432587, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 5050 + }, + { + "epoch": 2.11, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.45699938753077557, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7762091159820557, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8214, + "eval_samples_per_second": 20.387, + "eval_steps_per_second": 0.677, + "step": 5050 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.13, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6467, + "max_norm": 22.89735984802246, + "max_norm/layer0": 18.166860580444336, + "max_norm/layer1": 19.054595947265625, + "max_norm/layer10": 20.66739845275879, + "max_norm/layer11": 19.451705932617188, + "max_norm/layer12": 20.62177848815918, + "max_norm/layer13": 18.060523986816406, + "max_norm/layer14": 19.57383155822754, + "max_norm/layer15": 21.97449493408203, + "max_norm/layer16": 19.052349090576172, + "max_norm/layer17": 21.87696647644043, + "max_norm/layer18": 19.54570770263672, + "max_norm/layer19": 19.23660659790039, + "max_norm/layer2": 15.98861026763916, + "max_norm/layer20": 20.53759002685547, + "max_norm/layer21": 20.000146865844727, + "max_norm/layer22": 20.37427520751953, + "max_norm/layer23": 20.004507064819336, + "max_norm/layer3": 18.47233772277832, + "max_norm/layer4": 18.915876388549805, + "max_norm/layer5": 22.89735984802246, + "max_norm/layer6": 17.400609970092773, + "max_norm/layer7": 19.98491668701172, + "max_norm/layer8": 20.48213005065918, + "max_norm/layer9": 20.012739181518555, + "mean_norm": 9.734544103344282, + "mean_norm/layer0": 9.2623251080513, + "mean_norm/layer1": 9.320045828819275, + "mean_norm/layer10": 9.647578060626984, + "mean_norm/layer11": 9.840642750263214, + "mean_norm/layer12": 10.129788398742676, + "mean_norm/layer13": 9.607102155685425, + "mean_norm/layer14": 9.88111037015915, + "mean_norm/layer15": 10.071675181388855, + "mean_norm/layer16": 9.682976722717285, + "mean_norm/layer17": 10.03602159023285, + "mean_norm/layer18": 9.751314342021942, + "mean_norm/layer19": 9.7725231051445, + "mean_norm/layer2": 8.549007654190063, + "mean_norm/layer20": 9.87232106924057, + "mean_norm/layer21": 9.826198995113373, + "mean_norm/layer22": 10.448007762432098, + "mean_norm/layer23": 10.409220039844513, + "mean_norm/layer3": 9.975856363773346, + "mean_norm/layer4": 9.29235965013504, + "mean_norm/layer5": 10.736477971076965, + "mean_norm/layer6": 8.990878164768219, + "mean_norm/layer7": 9.319936335086823, + "mean_norm/layer8": 9.622983694076538, + "mean_norm/layer9": 9.582707166671753, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 5100 + }, + { + "epoch": 2.13, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4562327869783364, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.777289628982544, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5722, + "eval_samples_per_second": 20.826, + "eval_steps_per_second": 0.691, + "step": 5100 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.15, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6599, + "max_norm": 23.004852294921875, + "max_norm/layer0": 18.246042251586914, + "max_norm/layer1": 19.173181533813477, + "max_norm/layer10": 20.759347915649414, + "max_norm/layer11": 19.53813362121582, + "max_norm/layer12": 20.722137451171875, + "max_norm/layer13": 18.14091682434082, + "max_norm/layer14": 19.650548934936523, + "max_norm/layer15": 22.08029556274414, + "max_norm/layer16": 19.13140869140625, + "max_norm/layer17": 22.015832901000977, + "max_norm/layer18": 19.6434268951416, + "max_norm/layer19": 19.330032348632812, + "max_norm/layer2": 16.050338745117188, + "max_norm/layer20": 20.631410598754883, + "max_norm/layer21": 20.11321258544922, + "max_norm/layer22": 20.477571487426758, + "max_norm/layer23": 20.0946102142334, + "max_norm/layer3": 18.563167572021484, + "max_norm/layer4": 19.002338409423828, + "max_norm/layer5": 23.004852294921875, + "max_norm/layer6": 17.46533966064453, + "max_norm/layer7": 20.085609436035156, + "max_norm/layer8": 20.567922592163086, + "max_norm/layer9": 20.1201229095459, + "mean_norm": 9.746603799362978, + "mean_norm/layer0": 9.273974597454071, + "mean_norm/layer1": 9.330005407333374, + "mean_norm/layer10": 9.658581376075745, + "mean_norm/layer11": 9.853312253952026, + "mean_norm/layer12": 10.145055592060089, + "mean_norm/layer13": 9.618417501449585, + "mean_norm/layer14": 9.894328236579895, + "mean_norm/layer15": 10.086170971393585, + "mean_norm/layer16": 9.694756627082825, + "mean_norm/layer17": 10.049719512462616, + "mean_norm/layer18": 9.76311081647873, + "mean_norm/layer19": 9.784685909748077, + "mean_norm/layer2": 8.552568674087524, + "mean_norm/layer20": 9.884812831878662, + "mean_norm/layer21": 9.83890050649643, + "mean_norm/layer22": 10.464799404144287, + "mean_norm/layer23": 10.425880491733551, + "mean_norm/layer3": 9.98993718624115, + "mean_norm/layer4": 9.300775229930878, + "mean_norm/layer5": 10.755446791648865, + "mean_norm/layer6": 8.997404158115387, + "mean_norm/layer7": 9.328621327877045, + "mean_norm/layer8": 9.63390564918518, + "mean_norm/layer9": 9.59332013130188, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 5150 + }, + { + "epoch": 2.15, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4562287308907574, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7837729454040527, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8574, + "eval_samples_per_second": 20.325, + "eval_steps_per_second": 0.675, + "step": 5150 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.17, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6557, + "max_norm": 23.14448356628418, + "max_norm/layer0": 18.320140838623047, + "max_norm/layer1": 19.293155670166016, + "max_norm/layer10": 20.861385345458984, + "max_norm/layer11": 19.622970581054688, + "max_norm/layer12": 20.83387565612793, + "max_norm/layer13": 18.22727394104004, + "max_norm/layer14": 19.7342586517334, + "max_norm/layer15": 22.176088333129883, + "max_norm/layer16": 19.23335075378418, + "max_norm/layer17": 22.15247917175293, + "max_norm/layer18": 19.74405860900879, + "max_norm/layer19": 19.428447723388672, + "max_norm/layer2": 16.106197357177734, + "max_norm/layer20": 20.740074157714844, + "max_norm/layer21": 20.21061897277832, + "max_norm/layer22": 20.575672149658203, + "max_norm/layer23": 20.196548461914062, + "max_norm/layer3": 18.64171600341797, + "max_norm/layer4": 19.0919132232666, + "max_norm/layer5": 23.14448356628418, + "max_norm/layer6": 17.518203735351562, + "max_norm/layer7": 20.20140838623047, + "max_norm/layer8": 20.656841278076172, + "max_norm/layer9": 20.232519149780273, + "mean_norm": 9.758909354607264, + "mean_norm/layer0": 9.285945355892181, + "mean_norm/layer1": 9.340204358100891, + "mean_norm/layer10": 9.669862568378448, + "mean_norm/layer11": 9.86609172821045, + "mean_norm/layer12": 10.160631120204926, + "mean_norm/layer13": 9.630088806152344, + "mean_norm/layer14": 9.907589554786682, + "mean_norm/layer15": 10.100898385047913, + "mean_norm/layer16": 9.706718385219574, + "mean_norm/layer17": 10.063713669776917, + "mean_norm/layer18": 9.77525269985199, + "mean_norm/layer19": 9.797052562236786, + "mean_norm/layer2": 8.556278944015503, + "mean_norm/layer20": 9.89769971370697, + "mean_norm/layer21": 9.851765871047974, + "mean_norm/layer22": 10.482112884521484, + "mean_norm/layer23": 10.442677736282349, + "mean_norm/layer3": 10.004293620586395, + "mean_norm/layer4": 9.30946832895279, + "mean_norm/layer5": 10.774869859218597, + "mean_norm/layer6": 9.004033982753754, + "mean_norm/layer7": 9.337443828582764, + "mean_norm/layer8": 9.644962728023529, + "mean_norm/layer9": 9.604167819023132, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 5200 + }, + { + "epoch": 2.17, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.45675602227603296, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7779088020324707, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8191, + "eval_samples_per_second": 20.391, + "eval_steps_per_second": 0.677, + "step": 5200 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.19, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6622, + "max_norm": 23.266572952270508, + "max_norm/layer0": 18.395366668701172, + "max_norm/layer1": 19.405048370361328, + "max_norm/layer10": 20.944896697998047, + "max_norm/layer11": 19.703922271728516, + "max_norm/layer12": 20.931015014648438, + "max_norm/layer13": 18.32317543029785, + "max_norm/layer14": 19.821910858154297, + "max_norm/layer15": 22.291412353515625, + "max_norm/layer16": 19.31391716003418, + "max_norm/layer17": 22.261930465698242, + "max_norm/layer18": 19.85706901550293, + "max_norm/layer19": 19.519027709960938, + "max_norm/layer2": 16.164764404296875, + "max_norm/layer20": 20.836637496948242, + "max_norm/layer21": 20.297468185424805, + "max_norm/layer22": 20.689680099487305, + "max_norm/layer23": 20.2936954498291, + "max_norm/layer3": 18.744632720947266, + "max_norm/layer4": 19.17936897277832, + "max_norm/layer5": 23.266572952270508, + "max_norm/layer6": 17.58405876159668, + "max_norm/layer7": 20.27602195739746, + "max_norm/layer8": 20.73196029663086, + "max_norm/layer9": 20.32901382446289, + "mean_norm": 9.770990287264189, + "mean_norm/layer0": 9.297839343547821, + "mean_norm/layer1": 9.350374460220337, + "mean_norm/layer10": 9.681010365486145, + "mean_norm/layer11": 9.878672003746033, + "mean_norm/layer12": 10.175971269607544, + "mean_norm/layer13": 9.64153653383255, + "mean_norm/layer14": 9.920740842819214, + "mean_norm/layer15": 10.1153604388237, + "mean_norm/layer16": 9.718545377254486, + "mean_norm/layer17": 10.077604353427887, + "mean_norm/layer18": 9.787011325359344, + "mean_norm/layer19": 9.809286177158356, + "mean_norm/layer2": 8.559925496578217, + "mean_norm/layer20": 9.910324573516846, + "mean_norm/layer21": 9.864007830619812, + "mean_norm/layer22": 10.498671770095825, + "mean_norm/layer23": 10.459164440631866, + "mean_norm/layer3": 10.01849776506424, + "mean_norm/layer4": 9.317963421344757, + "mean_norm/layer5": 10.793861210346222, + "mean_norm/layer6": 9.010525822639465, + "mean_norm/layer7": 9.346060633659363, + "mean_norm/layer8": 9.655949771404266, + "mean_norm/layer9": 9.61486166715622, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 5250 + }, + { + "epoch": 2.19, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4562327869783364, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7806594371795654, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8078, + "eval_samples_per_second": 20.41, + "eval_steps_per_second": 0.678, + "step": 5250 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.21, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6863, + "max_norm": 23.383268356323242, + "max_norm/layer0": 18.473617553710938, + "max_norm/layer1": 19.516151428222656, + "max_norm/layer10": 21.03118324279785, + "max_norm/layer11": 19.796005249023438, + "max_norm/layer12": 21.034351348876953, + "max_norm/layer13": 18.400510787963867, + "max_norm/layer14": 19.89116859436035, + "max_norm/layer15": 22.391456604003906, + "max_norm/layer16": 19.405385971069336, + "max_norm/layer17": 22.3623046875, + "max_norm/layer18": 19.993558883666992, + "max_norm/layer19": 19.62684440612793, + "max_norm/layer2": 16.235048294067383, + "max_norm/layer20": 20.942127227783203, + "max_norm/layer21": 20.385709762573242, + "max_norm/layer22": 20.807687759399414, + "max_norm/layer23": 20.388404846191406, + "max_norm/layer3": 18.837236404418945, + "max_norm/layer4": 19.27210235595703, + "max_norm/layer5": 23.383268356323242, + "max_norm/layer6": 17.637849807739258, + "max_norm/layer7": 20.35446548461914, + "max_norm/layer8": 20.819650650024414, + "max_norm/layer9": 20.413063049316406, + "mean_norm": 9.782849095761776, + "mean_norm/layer0": 9.30956506729126, + "mean_norm/layer1": 9.360318064689636, + "mean_norm/layer10": 9.691880643367767, + "mean_norm/layer11": 9.891013085842133, + "mean_norm/layer12": 10.190861105918884, + "mean_norm/layer13": 9.652708292007446, + "mean_norm/layer14": 9.933558821678162, + "mean_norm/layer15": 10.129729926586151, + "mean_norm/layer16": 9.730214476585388, + "mean_norm/layer17": 10.091246604919434, + "mean_norm/layer18": 9.79846078157425, + "mean_norm/layer19": 9.821033775806427, + "mean_norm/layer2": 8.563501000404358, + "mean_norm/layer20": 9.922536730766296, + "mean_norm/layer21": 9.876113593578339, + "mean_norm/layer22": 10.515062034130096, + "mean_norm/layer23": 10.47534316778183, + "mean_norm/layer3": 10.032526850700378, + "mean_norm/layer4": 9.326524913311005, + "mean_norm/layer5": 10.812679052352905, + "mean_norm/layer6": 9.016940891742706, + "mean_norm/layer7": 9.354610204696655, + "mean_norm/layer8": 9.666627705097198, + "mean_norm/layer9": 9.625321507453918, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 5300 + }, + { + "epoch": 2.21, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.45746178151478645, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7769699096679688, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.555, + "eval_samples_per_second": 20.857, + "eval_steps_per_second": 0.692, + "step": 5300 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.23, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.679, + "max_norm": 23.499439239501953, + "max_norm/layer0": 18.54343032836914, + "max_norm/layer1": 19.622438430786133, + "max_norm/layer10": 21.115442276000977, + "max_norm/layer11": 19.91941261291504, + "max_norm/layer12": 21.136581420898438, + "max_norm/layer13": 18.484241485595703, + "max_norm/layer14": 19.956186294555664, + "max_norm/layer15": 22.505870819091797, + "max_norm/layer16": 19.49273109436035, + "max_norm/layer17": 22.469552993774414, + "max_norm/layer18": 20.106782913208008, + "max_norm/layer19": 19.725515365600586, + "max_norm/layer2": 16.305809020996094, + "max_norm/layer20": 21.03738021850586, + "max_norm/layer21": 20.470613479614258, + "max_norm/layer22": 20.912168502807617, + "max_norm/layer23": 20.484712600708008, + "max_norm/layer3": 18.927547454833984, + "max_norm/layer4": 19.371742248535156, + "max_norm/layer5": 23.499439239501953, + "max_norm/layer6": 17.688518524169922, + "max_norm/layer7": 20.45281219482422, + "max_norm/layer8": 20.927034378051758, + "max_norm/layer9": 20.496910095214844, + "mean_norm": 9.794714162747065, + "mean_norm/layer0": 9.321279466152191, + "mean_norm/layer1": 9.370379328727722, + "mean_norm/layer10": 9.702701926231384, + "mean_norm/layer11": 9.903493821620941, + "mean_norm/layer12": 10.205870807170868, + "mean_norm/layer13": 9.66382622718811, + "mean_norm/layer14": 9.94619619846344, + "mean_norm/layer15": 10.14408254623413, + "mean_norm/layer16": 9.741806030273438, + "mean_norm/layer17": 10.104702532291412, + "mean_norm/layer18": 9.809928119182587, + "mean_norm/layer19": 9.832951545715332, + "mean_norm/layer2": 8.567113637924194, + "mean_norm/layer20": 9.934588551521301, + "mean_norm/layer21": 9.888190269470215, + "mean_norm/layer22": 10.531676888465881, + "mean_norm/layer23": 10.491473019123077, + "mean_norm/layer3": 10.046574115753174, + "mean_norm/layer4": 9.33499801158905, + "mean_norm/layer5": 10.831702411174774, + "mean_norm/layer6": 9.023348093032837, + "mean_norm/layer7": 9.363218486309052, + "mean_norm/layer8": 9.677422285079956, + "mean_norm/layer9": 9.635615587234497, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 5350 + }, + { + "epoch": 2.23, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4568695927282462, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.774198055267334, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8138, + "eval_samples_per_second": 20.4, + "eval_steps_per_second": 0.677, + "step": 5350 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.25, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6657, + "max_norm": 23.616012573242188, + "max_norm/layer0": 18.616952896118164, + "max_norm/layer1": 19.73339080810547, + "max_norm/layer10": 21.219606399536133, + "max_norm/layer11": 20.00966453552246, + "max_norm/layer12": 21.244117736816406, + "max_norm/layer13": 18.585554122924805, + "max_norm/layer14": 20.035675048828125, + "max_norm/layer15": 22.61372947692871, + "max_norm/layer16": 19.60413360595703, + "max_norm/layer17": 22.56954574584961, + "max_norm/layer18": 20.213354110717773, + "max_norm/layer19": 19.81522560119629, + "max_norm/layer2": 16.383325576782227, + "max_norm/layer20": 21.13914680480957, + "max_norm/layer21": 20.564655303955078, + "max_norm/layer22": 21.007658004760742, + "max_norm/layer23": 20.579490661621094, + "max_norm/layer3": 19.023515701293945, + "max_norm/layer4": 19.47603416442871, + "max_norm/layer5": 23.616012573242188, + "max_norm/layer6": 17.729270935058594, + "max_norm/layer7": 20.534603118896484, + "max_norm/layer8": 21.014896392822266, + "max_norm/layer9": 20.589609146118164, + "mean_norm": 9.806618705391884, + "mean_norm/layer0": 9.33316719532013, + "mean_norm/layer1": 9.38050252199173, + "mean_norm/layer10": 9.713618159294128, + "mean_norm/layer11": 9.915963411331177, + "mean_norm/layer12": 10.220970749855042, + "mean_norm/layer13": 9.674981594085693, + "mean_norm/layer14": 9.959041476249695, + "mean_norm/layer15": 10.158335328102112, + "mean_norm/layer16": 9.753474414348602, + "mean_norm/layer17": 10.118220508098602, + "mean_norm/layer18": 9.821493268013, + "mean_norm/layer19": 9.844790577888489, + "mean_norm/layer2": 8.570688605308533, + "mean_norm/layer20": 9.946804225444794, + "mean_norm/layer21": 9.90015572309494, + "mean_norm/layer22": 10.548267424106598, + "mean_norm/layer23": 10.507667362689972, + "mean_norm/layer3": 10.06048858165741, + "mean_norm/layer4": 9.343421339988708, + "mean_norm/layer5": 10.850700914859772, + "mean_norm/layer6": 9.029772937297821, + "mean_norm/layer7": 9.37190467119217, + "mean_norm/layer8": 9.68824589252472, + "mean_norm/layer9": 9.646172046661377, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 5400 + }, + { + "epoch": 2.25, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.45795662419942973, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.773238182067871, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8161, + "eval_samples_per_second": 20.396, + "eval_steps_per_second": 0.677, + "step": 5400 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.28, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6707, + "max_norm": 23.711584091186523, + "max_norm/layer0": 18.696035385131836, + "max_norm/layer1": 19.86383628845215, + "max_norm/layer10": 21.319568634033203, + "max_norm/layer11": 20.104448318481445, + "max_norm/layer12": 21.343198776245117, + "max_norm/layer13": 18.65641212463379, + "max_norm/layer14": 20.11650848388672, + "max_norm/layer15": 22.714111328125, + "max_norm/layer16": 19.710603713989258, + "max_norm/layer17": 22.677001953125, + "max_norm/layer18": 20.324527740478516, + "max_norm/layer19": 19.905961990356445, + "max_norm/layer2": 16.444032669067383, + "max_norm/layer20": 21.24724769592285, + "max_norm/layer21": 20.659025192260742, + "max_norm/layer22": 21.11807632446289, + "max_norm/layer23": 20.669883728027344, + "max_norm/layer3": 19.120800018310547, + "max_norm/layer4": 19.565460205078125, + "max_norm/layer5": 23.711584091186523, + "max_norm/layer6": 17.779829025268555, + "max_norm/layer7": 20.61775016784668, + "max_norm/layer8": 21.11190414428711, + "max_norm/layer9": 20.662193298339844, + "mean_norm": 9.81824733565251, + "mean_norm/layer0": 9.344789624214172, + "mean_norm/layer1": 9.390469372272491, + "mean_norm/layer10": 9.724392533302307, + "mean_norm/layer11": 9.928160071372986, + "mean_norm/layer12": 10.235535979270935, + "mean_norm/layer13": 9.685753464698792, + "mean_norm/layer14": 9.971448719501495, + "mean_norm/layer15": 10.172397494316101, + "mean_norm/layer16": 9.764802813529968, + "mean_norm/layer17": 10.131413161754608, + "mean_norm/layer18": 9.832902252674103, + "mean_norm/layer19": 9.856505811214447, + "mean_norm/layer2": 8.574154257774353, + "mean_norm/layer20": 9.958525598049164, + "mean_norm/layer21": 9.912037432193756, + "mean_norm/layer22": 10.564294755458832, + "mean_norm/layer23": 10.523465871810913, + "mean_norm/layer3": 10.074239313602448, + "mean_norm/layer4": 9.351719319820404, + "mean_norm/layer5": 10.869217932224274, + "mean_norm/layer6": 9.036074459552765, + "mean_norm/layer7": 9.380382359027863, + "mean_norm/layer8": 9.698756694793701, + "mean_norm/layer9": 9.65649676322937, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 5450 + }, + { + "epoch": 2.28, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4583906255703873, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.767972230911255, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5723, + "eval_samples_per_second": 20.826, + "eval_steps_per_second": 0.691, + "step": 5450 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.3, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6828, + "max_norm": 23.828529357910156, + "max_norm/layer0": 18.77942657470703, + "max_norm/layer1": 19.9698486328125, + "max_norm/layer10": 21.414457321166992, + "max_norm/layer11": 20.17760467529297, + "max_norm/layer12": 21.42694854736328, + "max_norm/layer13": 18.734359741210938, + "max_norm/layer14": 20.196672439575195, + "max_norm/layer15": 22.838233947753906, + "max_norm/layer16": 19.811031341552734, + "max_norm/layer17": 22.79621696472168, + "max_norm/layer18": 20.419069290161133, + "max_norm/layer19": 20.007299423217773, + "max_norm/layer2": 16.4896183013916, + "max_norm/layer20": 21.348735809326172, + "max_norm/layer21": 20.764799118041992, + "max_norm/layer22": 21.221994400024414, + "max_norm/layer23": 20.771209716796875, + "max_norm/layer3": 19.219717025756836, + "max_norm/layer4": 19.63283348083496, + "max_norm/layer5": 23.828529357910156, + "max_norm/layer6": 17.82144546508789, + "max_norm/layer7": 20.713653564453125, + "max_norm/layer8": 21.195741653442383, + "max_norm/layer9": 20.749263763427734, + "mean_norm": 9.829934562246004, + "mean_norm/layer0": 9.356457650661469, + "mean_norm/layer1": 9.400355875492096, + "mean_norm/layer10": 9.735199213027954, + "mean_norm/layer11": 9.940261006355286, + "mean_norm/layer12": 10.250323474407196, + "mean_norm/layer13": 9.696837365627289, + "mean_norm/layer14": 9.98394638299942, + "mean_norm/layer15": 10.186484932899475, + "mean_norm/layer16": 9.776153683662415, + "mean_norm/layer17": 10.144715905189514, + "mean_norm/layer18": 9.844414174556732, + "mean_norm/layer19": 9.86827665567398, + "mean_norm/layer2": 8.577622711658478, + "mean_norm/layer20": 9.970131814479828, + "mean_norm/layer21": 9.923815429210663, + "mean_norm/layer22": 10.580283641815186, + "mean_norm/layer23": 10.539456129074097, + "mean_norm/layer3": 10.088192164897919, + "mean_norm/layer4": 9.360041677951813, + "mean_norm/layer5": 10.888111174106598, + "mean_norm/layer6": 9.042340636253357, + "mean_norm/layer7": 9.388883471488953, + "mean_norm/layer8": 9.709352374076843, + "mean_norm/layer9": 9.666771948337555, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 5500 + }, + { + "epoch": 2.3, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.45791200723606024, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7675321102142334, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8324, + "eval_samples_per_second": 20.368, + "eval_steps_per_second": 0.676, + "step": 5500 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.32, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.669, + "max_norm": 23.937562942504883, + "max_norm/layer0": 18.859041213989258, + "max_norm/layer1": 20.078290939331055, + "max_norm/layer10": 21.511146545410156, + "max_norm/layer11": 20.23717498779297, + "max_norm/layer12": 21.525150299072266, + "max_norm/layer13": 18.80620765686035, + "max_norm/layer14": 20.277151107788086, + "max_norm/layer15": 22.951562881469727, + "max_norm/layer16": 19.92555809020996, + "max_norm/layer17": 22.931133270263672, + "max_norm/layer18": 20.521669387817383, + "max_norm/layer19": 20.11891746520996, + "max_norm/layer2": 16.537145614624023, + "max_norm/layer20": 21.444211959838867, + "max_norm/layer21": 20.847387313842773, + "max_norm/layer22": 21.34566879272461, + "max_norm/layer23": 20.86615562438965, + "max_norm/layer3": 19.326074600219727, + "max_norm/layer4": 19.71425437927246, + "max_norm/layer5": 23.937562942504883, + "max_norm/layer6": 17.873159408569336, + "max_norm/layer7": 20.806289672851562, + "max_norm/layer8": 21.297988891601562, + "max_norm/layer9": 20.845129013061523, + "mean_norm": 9.841606857875982, + "mean_norm/layer0": 9.368158996105194, + "mean_norm/layer1": 9.410395383834839, + "mean_norm/layer10": 9.74589717388153, + "mean_norm/layer11": 9.952390968799591, + "mean_norm/layer12": 10.265121459960938, + "mean_norm/layer13": 9.707781314849854, + "mean_norm/layer14": 9.996495127677917, + "mean_norm/layer15": 10.20052945613861, + "mean_norm/layer16": 9.78744912147522, + "mean_norm/layer17": 10.157939553260803, + "mean_norm/layer18": 9.85572999715805, + "mean_norm/layer19": 9.879987061023712, + "mean_norm/layer2": 8.581217646598816, + "mean_norm/layer20": 9.981558501720428, + "mean_norm/layer21": 9.935706377029419, + "mean_norm/layer22": 10.596454083919525, + "mean_norm/layer23": 10.555343270301819, + "mean_norm/layer3": 10.10208147764206, + "mean_norm/layer4": 9.36821448802948, + "mean_norm/layer5": 10.906881392002106, + "mean_norm/layer6": 9.04877257347107, + "mean_norm/layer7": 9.397431671619415, + "mean_norm/layer8": 9.720013678073883, + "mean_norm/layer9": 9.67701381444931, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 5550 + }, + { + "epoch": 2.32, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.45954255444283554, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7617156505584717, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8254, + "eval_samples_per_second": 20.38, + "eval_steps_per_second": 0.677, + "step": 5550 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.34, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6786, + "max_norm": 24.050399780273438, + "max_norm/layer0": 18.92856788635254, + "max_norm/layer1": 20.19409942626953, + "max_norm/layer10": 21.61579704284668, + "max_norm/layer11": 20.31001853942871, + "max_norm/layer12": 21.62428092956543, + "max_norm/layer13": 18.889577865600586, + "max_norm/layer14": 20.359472274780273, + "max_norm/layer15": 23.067659378051758, + "max_norm/layer16": 20.03011131286621, + "max_norm/layer17": 23.0419864654541, + "max_norm/layer18": 20.61798667907715, + "max_norm/layer19": 20.219560623168945, + "max_norm/layer2": 16.568180084228516, + "max_norm/layer20": 21.540401458740234, + "max_norm/layer21": 20.965660095214844, + "max_norm/layer22": 21.44856071472168, + "max_norm/layer23": 20.963855743408203, + "max_norm/layer3": 19.419219970703125, + "max_norm/layer4": 19.802261352539062, + "max_norm/layer5": 24.050399780273438, + "max_norm/layer6": 17.924131393432617, + "max_norm/layer7": 20.910070419311523, + "max_norm/layer8": 21.38106918334961, + "max_norm/layer9": 20.933855056762695, + "mean_norm": 9.853289564450582, + "mean_norm/layer0": 9.379805266857147, + "mean_norm/layer1": 9.420386135578156, + "mean_norm/layer10": 9.756702065467834, + "mean_norm/layer11": 9.96448564529419, + "mean_norm/layer12": 10.279956340789795, + "mean_norm/layer13": 9.718806564807892, + "mean_norm/layer14": 10.008846938610077, + "mean_norm/layer15": 10.214514553546906, + "mean_norm/layer16": 9.798823893070221, + "mean_norm/layer17": 10.17122620344162, + "mean_norm/layer18": 9.867085695266724, + "mean_norm/layer19": 9.89163064956665, + "mean_norm/layer2": 8.58489179611206, + "mean_norm/layer20": 9.993090152740479, + "mean_norm/layer21": 9.947735130786896, + "mean_norm/layer22": 10.612680315971375, + "mean_norm/layer23": 10.571164965629578, + "mean_norm/layer3": 10.11597990989685, + "mean_norm/layer4": 9.376480102539062, + "mean_norm/layer5": 10.925587713718414, + "mean_norm/layer6": 9.055172681808472, + "mean_norm/layer7": 9.405917942523956, + "mean_norm/layer8": 9.730691254138947, + "mean_norm/layer9": 9.687287628650665, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 5600 + }, + { + "epoch": 2.34, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.45928702092535584, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.764376401901245, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8216, + "eval_samples_per_second": 20.386, + "eval_steps_per_second": 0.677, + "step": 5600 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.36, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6938, + "max_norm": 24.169326782226562, + "max_norm/layer0": 19.0015926361084, + "max_norm/layer1": 20.306058883666992, + "max_norm/layer10": 21.70053482055664, + "max_norm/layer11": 20.392311096191406, + "max_norm/layer12": 21.714736938476562, + "max_norm/layer13": 18.960250854492188, + "max_norm/layer14": 20.45236587524414, + "max_norm/layer15": 23.201778411865234, + "max_norm/layer16": 20.125362396240234, + "max_norm/layer17": 23.156299591064453, + "max_norm/layer18": 20.71641731262207, + "max_norm/layer19": 20.32011604309082, + "max_norm/layer2": 16.6474666595459, + "max_norm/layer20": 21.623586654663086, + "max_norm/layer21": 21.088895797729492, + "max_norm/layer22": 21.558412551879883, + "max_norm/layer23": 21.069276809692383, + "max_norm/layer3": 19.493728637695312, + "max_norm/layer4": 19.86513328552246, + "max_norm/layer5": 24.169326782226562, + "max_norm/layer6": 17.97091293334961, + "max_norm/layer7": 21.01711654663086, + "max_norm/layer8": 21.452049255371094, + "max_norm/layer9": 21.005409240722656, + "mean_norm": 9.864638393123945, + "mean_norm/layer0": 9.3911452293396, + "mean_norm/layer1": 9.430276334285736, + "mean_norm/layer10": 9.767344295978546, + "mean_norm/layer11": 9.976312398910522, + "mean_norm/layer12": 10.294341802597046, + "mean_norm/layer13": 9.729567348957062, + "mean_norm/layer14": 10.02096837759018, + "mean_norm/layer15": 10.228092610836029, + "mean_norm/layer16": 9.809804558753967, + "mean_norm/layer17": 10.18399292230606, + "mean_norm/layer18": 9.878075778484344, + "mean_norm/layer19": 9.902792990207672, + "mean_norm/layer2": 8.58851420879364, + "mean_norm/layer20": 10.004315316677094, + "mean_norm/layer21": 9.95916599035263, + "mean_norm/layer22": 10.628167688846588, + "mean_norm/layer23": 10.586232781410217, + "mean_norm/layer3": 10.129510223865509, + "mean_norm/layer4": 9.384777843952179, + "mean_norm/layer5": 10.943991243839264, + "mean_norm/layer6": 9.061299085617065, + "mean_norm/layer7": 9.414314091205597, + "mean_norm/layer8": 9.741056561470032, + "mean_norm/layer9": 9.69726175069809, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 5650 + }, + { + "epoch": 2.36, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.45997655581379315, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.759434223175049, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5486, + "eval_samples_per_second": 20.868, + "eval_steps_per_second": 0.693, + "step": 5650 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.38, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6634, + "max_norm": 24.302297592163086, + "max_norm/layer0": 19.074230194091797, + "max_norm/layer1": 20.415058135986328, + "max_norm/layer10": 21.800249099731445, + "max_norm/layer11": 20.47414779663086, + "max_norm/layer12": 21.825576782226562, + "max_norm/layer13": 19.0487060546875, + "max_norm/layer14": 20.540529251098633, + "max_norm/layer15": 23.310043334960938, + "max_norm/layer16": 20.21319007873535, + "max_norm/layer17": 23.27543067932129, + "max_norm/layer18": 20.82416534423828, + "max_norm/layer19": 20.435667037963867, + "max_norm/layer2": 16.726856231689453, + "max_norm/layer20": 21.711185455322266, + "max_norm/layer21": 21.18751335144043, + "max_norm/layer22": 21.662084579467773, + "max_norm/layer23": 21.18093490600586, + "max_norm/layer3": 19.574790954589844, + "max_norm/layer4": 19.932098388671875, + "max_norm/layer5": 24.302297592163086, + "max_norm/layer6": 18.029502868652344, + "max_norm/layer7": 21.126331329345703, + "max_norm/layer8": 21.547332763671875, + "max_norm/layer9": 21.09630584716797, + "mean_norm": 9.876142094532648, + "mean_norm/layer0": 9.402709722518921, + "mean_norm/layer1": 9.440324366092682, + "mean_norm/layer10": 9.777914643287659, + "mean_norm/layer11": 9.988339364528656, + "mean_norm/layer12": 10.308962106704712, + "mean_norm/layer13": 9.740558981895447, + "mean_norm/layer14": 10.03328812122345, + "mean_norm/layer15": 10.241935729980469, + "mean_norm/layer16": 9.820912420749664, + "mean_norm/layer17": 10.196899771690369, + "mean_norm/layer18": 9.889229655265808, + "mean_norm/layer19": 9.913987636566162, + "mean_norm/layer2": 8.59205949306488, + "mean_norm/layer20": 10.01566457748413, + "mean_norm/layer21": 9.970516860485077, + "mean_norm/layer22": 10.643815875053406, + "mean_norm/layer23": 10.601855099201202, + "mean_norm/layer3": 10.143052756786346, + "mean_norm/layer4": 9.393064022064209, + "mean_norm/layer5": 10.962677597999573, + "mean_norm/layer6": 9.067675769329071, + "mean_norm/layer7": 9.4227814078331, + "mean_norm/layer8": 9.751694977283478, + "mean_norm/layer9": 9.707489311695099, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 5700 + }, + { + "epoch": 2.38, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4612258307881384, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.753422975540161, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8169, + "eval_samples_per_second": 20.395, + "eval_steps_per_second": 0.677, + "step": 5700 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.4, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6744, + "max_norm": 24.415847778320312, + "max_norm/layer0": 19.146425247192383, + "max_norm/layer1": 20.51773452758789, + "max_norm/layer10": 21.890947341918945, + "max_norm/layer11": 20.550748825073242, + "max_norm/layer12": 21.946949005126953, + "max_norm/layer13": 19.112741470336914, + "max_norm/layer14": 20.610857009887695, + "max_norm/layer15": 23.442441940307617, + "max_norm/layer16": 20.31297492980957, + "max_norm/layer17": 23.392274856567383, + "max_norm/layer18": 20.90896987915039, + "max_norm/layer19": 20.549793243408203, + "max_norm/layer2": 16.79773712158203, + "max_norm/layer20": 21.813404083251953, + "max_norm/layer21": 21.293352127075195, + "max_norm/layer22": 21.788415908813477, + "max_norm/layer23": 21.271108627319336, + "max_norm/layer3": 19.66872787475586, + "max_norm/layer4": 19.997684478759766, + "max_norm/layer5": 24.415847778320312, + "max_norm/layer6": 18.082775115966797, + "max_norm/layer7": 21.22279167175293, + "max_norm/layer8": 21.611251831054688, + "max_norm/layer9": 21.174211502075195, + "mean_norm": 9.887629655500254, + "mean_norm/layer0": 9.41416311264038, + "mean_norm/layer1": 9.450378060340881, + "mean_norm/layer10": 9.788468480110168, + "mean_norm/layer11": 10.000294208526611, + "mean_norm/layer12": 10.323612809181213, + "mean_norm/layer13": 9.751441478729248, + "mean_norm/layer14": 10.045649409294128, + "mean_norm/layer15": 10.255648970603943, + "mean_norm/layer16": 9.831993281841278, + "mean_norm/layer17": 10.209833085536957, + "mean_norm/layer18": 9.900463461875916, + "mean_norm/layer19": 9.925138771533966, + "mean_norm/layer2": 8.595655858516693, + "mean_norm/layer20": 10.027330756187439, + "mean_norm/layer21": 9.981902122497559, + "mean_norm/layer22": 10.65961903333664, + "mean_norm/layer23": 10.617213129997253, + "mean_norm/layer3": 10.156732320785522, + "mean_norm/layer4": 9.401276051998138, + "mean_norm/layer5": 10.9812912940979, + "mean_norm/layer6": 9.073957800865173, + "mean_norm/layer7": 9.43110179901123, + "mean_norm/layer8": 9.762260735034943, + "mean_norm/layer9": 9.71768569946289, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 5750 + }, + { + "epoch": 2.4, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46095812900792155, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7510087490081787, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6121, + "eval_samples_per_second": 20.754, + "eval_steps_per_second": 0.689, + "step": 5750 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.42, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6799, + "max_norm": 24.525354385375977, + "max_norm/layer0": 19.21927833557129, + "max_norm/layer1": 20.611085891723633, + "max_norm/layer10": 21.969202041625977, + "max_norm/layer11": 20.64573860168457, + "max_norm/layer12": 22.06580352783203, + "max_norm/layer13": 19.187246322631836, + "max_norm/layer14": 20.70265007019043, + "max_norm/layer15": 23.571685791015625, + "max_norm/layer16": 20.39738655090332, + "max_norm/layer17": 23.50619125366211, + "max_norm/layer18": 20.994590759277344, + "max_norm/layer19": 20.64227867126465, + "max_norm/layer2": 16.8626651763916, + "max_norm/layer20": 21.89752197265625, + "max_norm/layer21": 21.396255493164062, + "max_norm/layer22": 21.888132095336914, + "max_norm/layer23": 21.377004623413086, + "max_norm/layer3": 19.76741600036621, + "max_norm/layer4": 20.093164443969727, + "max_norm/layer5": 24.525354385375977, + "max_norm/layer6": 18.127910614013672, + "max_norm/layer7": 21.337644577026367, + "max_norm/layer8": 21.689964294433594, + "max_norm/layer9": 21.269315719604492, + "mean_norm": 9.899055920541286, + "mean_norm/layer0": 9.425514936447144, + "mean_norm/layer1": 9.460303664207458, + "mean_norm/layer10": 9.798951029777527, + "mean_norm/layer11": 10.012129306793213, + "mean_norm/layer12": 10.338140368461609, + "mean_norm/layer13": 9.762259364128113, + "mean_norm/layer14": 10.057992458343506, + "mean_norm/layer15": 10.26939058303833, + "mean_norm/layer16": 9.843165934085846, + "mean_norm/layer17": 10.222750306129456, + "mean_norm/layer18": 9.911642968654633, + "mean_norm/layer19": 9.936326265335083, + "mean_norm/layer2": 8.599254548549652, + "mean_norm/layer20": 10.038680911064148, + "mean_norm/layer21": 9.993187129497528, + "mean_norm/layer22": 10.675156891345978, + "mean_norm/layer23": 10.632552742958069, + "mean_norm/layer3": 10.170215964317322, + "mean_norm/layer4": 9.40942233800888, + "mean_norm/layer5": 10.999845743179321, + "mean_norm/layer6": 9.080201625823975, + "mean_norm/layer7": 9.439405918121338, + "mean_norm/layer8": 9.772936880588531, + "mean_norm/layer9": 9.727914214134216, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 5800 + }, + { + "epoch": 2.42, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4608202220302341, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7505526542663574, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7927, + "eval_samples_per_second": 20.436, + "eval_steps_per_second": 0.678, + "step": 5800 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.44, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6799, + "max_norm": 24.64824676513672, + "max_norm/layer0": 19.30046844482422, + "max_norm/layer1": 20.69877815246582, + "max_norm/layer10": 22.053220748901367, + "max_norm/layer11": 20.724355697631836, + "max_norm/layer12": 22.196802139282227, + "max_norm/layer13": 19.268417358398438, + "max_norm/layer14": 20.79410171508789, + "max_norm/layer15": 23.694843292236328, + "max_norm/layer16": 20.494922637939453, + "max_norm/layer17": 23.64689064025879, + "max_norm/layer18": 21.078306198120117, + "max_norm/layer19": 20.727556228637695, + "max_norm/layer2": 16.929187774658203, + "max_norm/layer20": 21.985841751098633, + "max_norm/layer21": 21.498451232910156, + "max_norm/layer22": 21.993858337402344, + "max_norm/layer23": 21.484207153320312, + "max_norm/layer3": 19.888816833496094, + "max_norm/layer4": 20.171184539794922, + "max_norm/layer5": 24.64824676513672, + "max_norm/layer6": 18.182086944580078, + "max_norm/layer7": 21.449859619140625, + "max_norm/layer8": 21.770164489746094, + "max_norm/layer9": 21.34680938720703, + "mean_norm": 9.910489511986574, + "mean_norm/layer0": 9.436944603919983, + "mean_norm/layer1": 9.470270037651062, + "mean_norm/layer10": 9.809482991695404, + "mean_norm/layer11": 10.023900032043457, + "mean_norm/layer12": 10.35284686088562, + "mean_norm/layer13": 9.773071646690369, + "mean_norm/layer14": 10.070310354232788, + "mean_norm/layer15": 10.283128798007965, + "mean_norm/layer16": 9.854249835014343, + "mean_norm/layer17": 10.235677301883698, + "mean_norm/layer18": 9.922667562961578, + "mean_norm/layer19": 9.947410225868225, + "mean_norm/layer2": 8.602798521518707, + "mean_norm/layer20": 10.04989892244339, + "mean_norm/layer21": 10.00466388463974, + "mean_norm/layer22": 10.69081175327301, + "mean_norm/layer23": 10.647965610027313, + "mean_norm/layer3": 10.18393588066101, + "mean_norm/layer4": 9.417515218257904, + "mean_norm/layer5": 11.018384039402008, + "mean_norm/layer6": 9.086404740810394, + "mean_norm/layer7": 9.447878897190094, + "mean_norm/layer8": 9.78347784280777, + "mean_norm/layer9": 9.738052725791931, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 5850 + }, + { + "epoch": 2.44, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4599846679889512, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.754044771194458, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8217, + "eval_samples_per_second": 20.386, + "eval_steps_per_second": 0.677, + "step": 5850 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.46, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6767, + "max_norm": 24.753965377807617, + "max_norm/layer0": 19.378158569335938, + "max_norm/layer1": 20.807764053344727, + "max_norm/layer10": 22.12616539001465, + "max_norm/layer11": 20.805105209350586, + "max_norm/layer12": 22.287803649902344, + "max_norm/layer13": 19.338436126708984, + "max_norm/layer14": 20.869544982910156, + "max_norm/layer15": 23.80994987487793, + "max_norm/layer16": 20.60982894897461, + "max_norm/layer17": 23.77663230895996, + "max_norm/layer18": 21.178482055664062, + "max_norm/layer19": 20.830650329589844, + "max_norm/layer2": 16.985960006713867, + "max_norm/layer20": 22.095294952392578, + "max_norm/layer21": 21.586101531982422, + "max_norm/layer22": 22.09933090209961, + "max_norm/layer23": 21.59579849243164, + "max_norm/layer3": 20.020875930786133, + "max_norm/layer4": 20.229372024536133, + "max_norm/layer5": 24.753965377807617, + "max_norm/layer6": 18.241554260253906, + "max_norm/layer7": 21.56122589111328, + "max_norm/layer8": 21.847877502441406, + "max_norm/layer9": 21.414751052856445, + "mean_norm": 9.92179693778356, + "mean_norm/layer0": 9.448293924331665, + "mean_norm/layer1": 9.480082273483276, + "mean_norm/layer10": 9.82001268863678, + "mean_norm/layer11": 10.035534679889679, + "mean_norm/layer12": 10.367335975170135, + "mean_norm/layer13": 9.783747255802155, + "mean_norm/layer14": 10.08247172832489, + "mean_norm/layer15": 10.296784579753876, + "mean_norm/layer16": 9.865318357944489, + "mean_norm/layer17": 10.248357355594635, + "mean_norm/layer18": 9.933477759361267, + "mean_norm/layer19": 9.958428800106049, + "mean_norm/layer2": 8.606263518333435, + "mean_norm/layer20": 10.06111353635788, + "mean_norm/layer21": 10.016002595424652, + "mean_norm/layer22": 10.70626699924469, + "mean_norm/layer23": 10.663025915622711, + "mean_norm/layer3": 10.197382926940918, + "mean_norm/layer4": 9.42559802532196, + "mean_norm/layer5": 11.036820828914642, + "mean_norm/layer6": 9.092549324035645, + "mean_norm/layer7": 9.456212759017944, + "mean_norm/layer8": 9.79387241601944, + "mean_norm/layer9": 9.748172283172607, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 5900 + }, + { + "epoch": 2.46, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4604754545860154, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.751302719116211, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5986, + "eval_samples_per_second": 20.778, + "eval_steps_per_second": 0.69, + "step": 5900 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.48, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6723, + "max_norm": 24.86185073852539, + "max_norm/layer0": 19.464832305908203, + "max_norm/layer1": 20.904747009277344, + "max_norm/layer10": 22.21963882446289, + "max_norm/layer11": 20.90224838256836, + "max_norm/layer12": 22.370943069458008, + "max_norm/layer13": 19.404891967773438, + "max_norm/layer14": 20.9664249420166, + "max_norm/layer15": 23.94396209716797, + "max_norm/layer16": 20.73137664794922, + "max_norm/layer17": 23.91629409790039, + "max_norm/layer18": 21.258281707763672, + "max_norm/layer19": 20.940629959106445, + "max_norm/layer2": 17.0539493560791, + "max_norm/layer20": 22.18185043334961, + "max_norm/layer21": 21.683847427368164, + "max_norm/layer22": 22.20035171508789, + "max_norm/layer23": 21.70345115661621, + "max_norm/layer3": 20.125995635986328, + "max_norm/layer4": 20.29149055480957, + "max_norm/layer5": 24.86185073852539, + "max_norm/layer6": 18.295093536376953, + "max_norm/layer7": 21.663230895996094, + "max_norm/layer8": 21.92238426208496, + "max_norm/layer9": 21.488218307495117, + "mean_norm": 9.932985362907251, + "mean_norm/layer0": 9.459501802921295, + "mean_norm/layer1": 9.489829063415527, + "mean_norm/layer10": 9.830254077911377, + "mean_norm/layer11": 10.04719090461731, + "mean_norm/layer12": 10.381703913211823, + "mean_norm/layer13": 9.79422265291214, + "mean_norm/layer14": 10.094463765621185, + "mean_norm/layer15": 10.310104370117188, + "mean_norm/layer16": 9.876312971115112, + "mean_norm/layer17": 10.260833084583282, + "mean_norm/layer18": 9.944314777851105, + "mean_norm/layer19": 9.969380855560303, + "mean_norm/layer2": 8.609793603420258, + "mean_norm/layer20": 10.072267889976501, + "mean_norm/layer21": 10.027061522006989, + "mean_norm/layer22": 10.721749186515808, + "mean_norm/layer23": 10.678084135055542, + "mean_norm/layer3": 10.210697650909424, + "mean_norm/layer4": 9.433561861515045, + "mean_norm/layer5": 11.054940581321716, + "mean_norm/layer6": 9.098546802997589, + "mean_norm/layer7": 9.46446293592453, + "mean_norm/layer8": 9.804116070270538, + "mean_norm/layer9": 9.75825423002243, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 5950 + }, + { + "epoch": 2.48, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46160304693298937, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.748650074005127, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 10.808, + "eval_samples_per_second": 22.298, + "eval_steps_per_second": 0.74, + "step": 5950 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.51, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6815, + "max_norm": 24.977638244628906, + "max_norm/layer0": 19.546966552734375, + "max_norm/layer1": 20.998462677001953, + "max_norm/layer10": 22.314041137695312, + "max_norm/layer11": 20.974071502685547, + "max_norm/layer12": 22.48418617248535, + "max_norm/layer13": 19.48900032043457, + "max_norm/layer14": 21.050722122192383, + "max_norm/layer15": 24.082304000854492, + "max_norm/layer16": 20.837448120117188, + "max_norm/layer17": 24.036243438720703, + "max_norm/layer18": 21.340248107910156, + "max_norm/layer19": 21.039228439331055, + "max_norm/layer2": 17.137115478515625, + "max_norm/layer20": 22.27361297607422, + "max_norm/layer21": 21.761518478393555, + "max_norm/layer22": 22.311800003051758, + "max_norm/layer23": 21.796558380126953, + "max_norm/layer3": 20.21436309814453, + "max_norm/layer4": 20.353113174438477, + "max_norm/layer5": 24.977638244628906, + "max_norm/layer6": 18.35504150390625, + "max_norm/layer7": 21.75100326538086, + "max_norm/layer8": 22.014951705932617, + "max_norm/layer9": 21.569259643554688, + "mean_norm": 9.944234107931456, + "mean_norm/layer0": 9.470636069774628, + "mean_norm/layer1": 9.499629974365234, + "mean_norm/layer10": 9.840614199638367, + "mean_norm/layer11": 10.05879956483841, + "mean_norm/layer12": 10.396033763885498, + "mean_norm/layer13": 9.804863929748535, + "mean_norm/layer14": 10.106550097465515, + "mean_norm/layer15": 10.323493957519531, + "mean_norm/layer16": 9.887224614620209, + "mean_norm/layer17": 10.27337783575058, + "mean_norm/layer18": 9.955014765262604, + "mean_norm/layer19": 9.980344355106354, + "mean_norm/layer2": 8.613344311714172, + "mean_norm/layer20": 10.083471596240997, + "mean_norm/layer21": 10.03798758983612, + "mean_norm/layer22": 10.737454056739807, + "mean_norm/layer23": 10.69325703382492, + "mean_norm/layer3": 10.224131882190704, + "mean_norm/layer4": 9.441782593727112, + "mean_norm/layer5": 11.073285281658173, + "mean_norm/layer6": 9.104702413082123, + "mean_norm/layer7": 9.472704946994781, + "mean_norm/layer8": 9.81453275680542, + "mean_norm/layer9": 9.768380999565125, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 6000 + }, + { + "epoch": 2.51, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4614570277801438, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.746541976928711, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8304, + "eval_samples_per_second": 20.371, + "eval_steps_per_second": 0.676, + "step": 6000 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.53, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6786, + "max_norm": 25.10230827331543, + "max_norm/layer0": 19.610563278198242, + "max_norm/layer1": 21.094833374023438, + "max_norm/layer10": 22.392915725708008, + "max_norm/layer11": 21.059268951416016, + "max_norm/layer12": 22.60821533203125, + "max_norm/layer13": 19.56475830078125, + "max_norm/layer14": 21.15677833557129, + "max_norm/layer15": 24.223785400390625, + "max_norm/layer16": 20.94610595703125, + "max_norm/layer17": 24.151611328125, + "max_norm/layer18": 21.432071685791016, + "max_norm/layer19": 21.153385162353516, + "max_norm/layer2": 17.234243392944336, + "max_norm/layer20": 22.37726593017578, + "max_norm/layer21": 21.85563850402832, + "max_norm/layer22": 22.410329818725586, + "max_norm/layer23": 21.884920120239258, + "max_norm/layer3": 20.298763275146484, + "max_norm/layer4": 20.410865783691406, + "max_norm/layer5": 25.10230827331543, + "max_norm/layer6": 18.404077529907227, + "max_norm/layer7": 21.845476150512695, + "max_norm/layer8": 22.08577537536621, + "max_norm/layer9": 21.64267349243164, + "mean_norm": 9.955603557328383, + "mean_norm/layer0": 9.481941640377045, + "mean_norm/layer1": 9.509676814079285, + "mean_norm/layer10": 9.851111769676208, + "mean_norm/layer11": 10.070666432380676, + "mean_norm/layer12": 10.410649418830872, + "mean_norm/layer13": 9.815576553344727, + "mean_norm/layer14": 10.118753135204315, + "mean_norm/layer15": 10.337125837802887, + "mean_norm/layer16": 9.898253440856934, + "mean_norm/layer17": 10.28607988357544, + "mean_norm/layer18": 9.965818166732788, + "mean_norm/layer19": 9.991341471672058, + "mean_norm/layer2": 8.616923332214355, + "mean_norm/layer20": 10.094838857650757, + "mean_norm/layer21": 10.049068450927734, + "mean_norm/layer22": 10.753166139125824, + "mean_norm/layer23": 10.708418011665344, + "mean_norm/layer3": 10.237691342830658, + "mean_norm/layer4": 9.450024247169495, + "mean_norm/layer5": 11.09180212020874, + "mean_norm/layer6": 9.110926032066345, + "mean_norm/layer7": 9.481049478054047, + "mean_norm/layer8": 9.825046956539154, + "mean_norm/layer9": 9.778535842895508, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 6050 + }, + { + "epoch": 2.53, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4603294354331699, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7469117641448975, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7837, + "eval_samples_per_second": 20.452, + "eval_steps_per_second": 0.679, + "step": 6050 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.55, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6766, + "max_norm": 25.228403091430664, + "max_norm/layer0": 19.683305740356445, + "max_norm/layer1": 21.202486038208008, + "max_norm/layer10": 22.478837966918945, + "max_norm/layer11": 21.12628173828125, + "max_norm/layer12": 22.69508171081543, + "max_norm/layer13": 19.65280532836914, + "max_norm/layer14": 21.235212326049805, + "max_norm/layer15": 24.364246368408203, + "max_norm/layer16": 21.056020736694336, + "max_norm/layer17": 24.269739151000977, + "max_norm/layer18": 21.526058197021484, + "max_norm/layer19": 21.24538230895996, + "max_norm/layer2": 17.323163986206055, + "max_norm/layer20": 22.47141456604004, + "max_norm/layer21": 21.953645706176758, + "max_norm/layer22": 22.524587631225586, + "max_norm/layer23": 21.973390579223633, + "max_norm/layer3": 20.381038665771484, + "max_norm/layer4": 20.474964141845703, + "max_norm/layer5": 25.228403091430664, + "max_norm/layer6": 18.45362663269043, + "max_norm/layer7": 21.947711944580078, + "max_norm/layer8": 22.164188385009766, + "max_norm/layer9": 21.733667373657227, + "mean_norm": 9.966820580263933, + "mean_norm/layer0": 9.493147373199463, + "mean_norm/layer1": 9.51956021785736, + "mean_norm/layer10": 9.861493289470673, + "mean_norm/layer11": 10.082270801067352, + "mean_norm/layer12": 10.42505133152008, + "mean_norm/layer13": 9.8261559009552, + "mean_norm/layer14": 10.130703926086426, + "mean_norm/layer15": 10.350493848323822, + "mean_norm/layer16": 9.909152209758759, + "mean_norm/layer17": 10.298548698425293, + "mean_norm/layer18": 9.976577043533325, + "mean_norm/layer19": 10.002244293689728, + "mean_norm/layer2": 8.620338201522827, + "mean_norm/layer20": 10.106268465518951, + "mean_norm/layer21": 10.06009829044342, + "mean_norm/layer22": 10.768470168113708, + "mean_norm/layer23": 10.723572373390198, + "mean_norm/layer3": 10.250972270965576, + "mean_norm/layer4": 9.458167791366577, + "mean_norm/layer5": 11.110156893730164, + "mean_norm/layer6": 9.117044448852539, + "mean_norm/layer7": 9.489368438720703, + "mean_norm/layer8": 9.835336029529572, + "mean_norm/layer9": 9.788501620292664, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 6100 + }, + { + "epoch": 2.55, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4611447090365575, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7434680461883545, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8476, + "eval_samples_per_second": 20.342, + "eval_steps_per_second": 0.675, + "step": 6100 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.57, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6922, + "max_norm": 25.344696044921875, + "max_norm/layer0": 19.766042709350586, + "max_norm/layer1": 21.28939437866211, + "max_norm/layer10": 22.563648223876953, + "max_norm/layer11": 21.195743560791016, + "max_norm/layer12": 22.773914337158203, + "max_norm/layer13": 19.732276916503906, + "max_norm/layer14": 21.32152557373047, + "max_norm/layer15": 24.493183135986328, + "max_norm/layer16": 21.16498374938965, + "max_norm/layer17": 24.38330841064453, + "max_norm/layer18": 21.610130310058594, + "max_norm/layer19": 21.38445281982422, + "max_norm/layer2": 17.382400512695312, + "max_norm/layer20": 22.576610565185547, + "max_norm/layer21": 22.033180236816406, + "max_norm/layer22": 22.632516860961914, + "max_norm/layer23": 22.06123161315918, + "max_norm/layer3": 20.473676681518555, + "max_norm/layer4": 20.537517547607422, + "max_norm/layer5": 25.344696044921875, + "max_norm/layer6": 18.493179321289062, + "max_norm/layer7": 22.041973114013672, + "max_norm/layer8": 22.243497848510742, + "max_norm/layer9": 21.801977157592773, + "mean_norm": 9.97796812405189, + "mean_norm/layer0": 9.504401445388794, + "mean_norm/layer1": 9.529353737831116, + "mean_norm/layer10": 9.871827602386475, + "mean_norm/layer11": 10.093893706798553, + "mean_norm/layer12": 10.439537703990936, + "mean_norm/layer13": 9.83659952878952, + "mean_norm/layer14": 10.142653703689575, + "mean_norm/layer15": 10.363728702068329, + "mean_norm/layer16": 9.919947028160095, + "mean_norm/layer17": 10.310964286327362, + "mean_norm/layer18": 9.987221598625183, + "mean_norm/layer19": 10.013190269470215, + "mean_norm/layer2": 8.623740553855896, + "mean_norm/layer20": 10.117258369922638, + "mean_norm/layer21": 10.071050822734833, + "mean_norm/layer22": 10.78360378742218, + "mean_norm/layer23": 10.73860216140747, + "mean_norm/layer3": 10.264272034168243, + "mean_norm/layer4": 9.466197848320007, + "mean_norm/layer5": 11.12835305929184, + "mean_norm/layer6": 9.123260974884033, + "mean_norm/layer7": 9.497576415538788, + "mean_norm/layer8": 9.845619022846222, + "mean_norm/layer9": 9.798380613327026, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 6150 + }, + { + "epoch": 2.57, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46083644638055027, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.742943286895752, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5803, + "eval_samples_per_second": 20.811, + "eval_steps_per_second": 0.691, + "step": 6150 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.59, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6689, + "max_norm": 25.47237777709961, + "max_norm/layer0": 19.861135482788086, + "max_norm/layer1": 21.369943618774414, + "max_norm/layer10": 22.645503997802734, + "max_norm/layer11": 21.277894973754883, + "max_norm/layer12": 22.86878204345703, + "max_norm/layer13": 19.81595802307129, + "max_norm/layer14": 21.395647048950195, + "max_norm/layer15": 24.607105255126953, + "max_norm/layer16": 21.273733139038086, + "max_norm/layer17": 24.506553649902344, + "max_norm/layer18": 21.704404830932617, + "max_norm/layer19": 21.492938995361328, + "max_norm/layer2": 17.44423484802246, + "max_norm/layer20": 22.680187225341797, + "max_norm/layer21": 22.106203079223633, + "max_norm/layer22": 22.743715286254883, + "max_norm/layer23": 22.155893325805664, + "max_norm/layer3": 20.574127197265625, + "max_norm/layer4": 20.620710372924805, + "max_norm/layer5": 25.47237777709961, + "max_norm/layer6": 18.549198150634766, + "max_norm/layer7": 22.10602569580078, + "max_norm/layer8": 22.323543548583984, + "max_norm/layer9": 21.855295181274414, + "mean_norm": 9.988959466417631, + "mean_norm/layer0": 9.515448808670044, + "mean_norm/layer1": 9.53911018371582, + "mean_norm/layer10": 9.881972074508667, + "mean_norm/layer11": 10.105316400527954, + "mean_norm/layer12": 10.45355623960495, + "mean_norm/layer13": 9.846928358078003, + "mean_norm/layer14": 10.154405415058136, + "mean_norm/layer15": 10.376791179180145, + "mean_norm/layer16": 9.930635511875153, + "mean_norm/layer17": 10.323196768760681, + "mean_norm/layer18": 9.997608542442322, + "mean_norm/layer19": 10.023785591125488, + "mean_norm/layer2": 8.627090692520142, + "mean_norm/layer20": 10.128102242946625, + "mean_norm/layer21": 10.081976056098938, + "mean_norm/layer22": 10.798811733722687, + "mean_norm/layer23": 10.753395140171051, + "mean_norm/layer3": 10.277292788028717, + "mean_norm/layer4": 9.473982751369476, + "mean_norm/layer5": 11.146383464336395, + "mean_norm/layer6": 9.129413843154907, + "mean_norm/layer7": 9.505711376667023, + "mean_norm/layer8": 9.855893790721893, + "mean_norm/layer9": 9.808218240737915, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 6200 + }, + { + "epoch": 2.59, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4616557760715169, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.739611864089966, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8022, + "eval_samples_per_second": 20.42, + "eval_steps_per_second": 0.678, + "step": 6200 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.61, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6832, + "max_norm": 25.609737396240234, + "max_norm/layer0": 19.959583282470703, + "max_norm/layer1": 21.443889617919922, + "max_norm/layer10": 22.741214752197266, + "max_norm/layer11": 21.409526824951172, + "max_norm/layer12": 22.951099395751953, + "max_norm/layer13": 19.897159576416016, + "max_norm/layer14": 21.47847557067871, + "max_norm/layer15": 24.755695343017578, + "max_norm/layer16": 21.364933013916016, + "max_norm/layer17": 24.639934539794922, + "max_norm/layer18": 21.792865753173828, + "max_norm/layer19": 21.58719825744629, + "max_norm/layer2": 17.523984909057617, + "max_norm/layer20": 22.785497665405273, + "max_norm/layer21": 22.198741912841797, + "max_norm/layer22": 22.869951248168945, + "max_norm/layer23": 22.246004104614258, + "max_norm/layer3": 20.67522430419922, + "max_norm/layer4": 20.69664764404297, + "max_norm/layer5": 25.609737396240234, + "max_norm/layer6": 18.605470657348633, + "max_norm/layer7": 22.189006805419922, + "max_norm/layer8": 22.403486251831055, + "max_norm/layer9": 21.930519104003906, + "mean_norm": 9.9999838595589, + "mean_norm/layer0": 9.526455461978912, + "mean_norm/layer1": 9.548912286758423, + "mean_norm/layer10": 9.892246067523956, + "mean_norm/layer11": 10.116952002048492, + "mean_norm/layer12": 10.467663824558258, + "mean_norm/layer13": 9.857439279556274, + "mean_norm/layer14": 10.166240513324738, + "mean_norm/layer15": 10.390120685100555, + "mean_norm/layer16": 9.941468596458435, + "mean_norm/layer17": 10.335450530052185, + "mean_norm/layer18": 10.008020222187042, + "mean_norm/layer19": 10.034397423267365, + "mean_norm/layer2": 8.630433797836304, + "mean_norm/layer20": 10.139144003391266, + "mean_norm/layer21": 10.092650175094604, + "mean_norm/layer22": 10.813849329948425, + "mean_norm/layer23": 10.767933666706085, + "mean_norm/layer3": 10.290472090244293, + "mean_norm/layer4": 9.481958389282227, + "mean_norm/layer5": 11.164432644844055, + "mean_norm/layer6": 9.135431170463562, + "mean_norm/layer7": 9.513876497745514, + "mean_norm/layer8": 9.866037726402283, + "mean_norm/layer9": 9.81802624464035, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 6250 + }, + { + "epoch": 2.61, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46189914132625953, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.735955238342285, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.9699, + "eval_samples_per_second": 20.134, + "eval_steps_per_second": 0.668, + "step": 6250 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.63, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6732, + "max_norm": 25.74430274963379, + "max_norm/layer0": 20.05502700805664, + "max_norm/layer1": 21.517070770263672, + "max_norm/layer10": 22.837778091430664, + "max_norm/layer11": 21.497528076171875, + "max_norm/layer12": 23.044620513916016, + "max_norm/layer13": 20.000743865966797, + "max_norm/layer14": 21.55751609802246, + "max_norm/layer15": 24.904428482055664, + "max_norm/layer16": 21.46048355102539, + "max_norm/layer17": 24.752845764160156, + "max_norm/layer18": 21.87999725341797, + "max_norm/layer19": 21.66996955871582, + "max_norm/layer2": 17.590194702148438, + "max_norm/layer20": 22.889404296875, + "max_norm/layer21": 22.268436431884766, + "max_norm/layer22": 22.98247718811035, + "max_norm/layer23": 22.344642639160156, + "max_norm/layer3": 20.77219009399414, + "max_norm/layer4": 20.779855728149414, + "max_norm/layer5": 25.74430274963379, + "max_norm/layer6": 18.65287208557129, + "max_norm/layer7": 22.270421981811523, + "max_norm/layer8": 22.518630981445312, + "max_norm/layer9": 22.00423812866211, + "mean_norm": 10.011001144846281, + "mean_norm/layer0": 9.537546277046204, + "mean_norm/layer1": 9.558590412139893, + "mean_norm/layer10": 9.902466833591461, + "mean_norm/layer11": 10.128420174121857, + "mean_norm/layer12": 10.481824576854706, + "mean_norm/layer13": 9.867795050144196, + "mean_norm/layer14": 10.178068697452545, + "mean_norm/layer15": 10.403307795524597, + "mean_norm/layer16": 9.952224373817444, + "mean_norm/layer17": 10.34775185585022, + "mean_norm/layer18": 10.018373608589172, + "mean_norm/layer19": 10.04506230354309, + "mean_norm/layer2": 8.633818507194519, + "mean_norm/layer20": 10.15004014968872, + "mean_norm/layer21": 10.103437781333923, + "mean_norm/layer22": 10.828993797302246, + "mean_norm/layer23": 10.78253710269928, + "mean_norm/layer3": 10.30362993478775, + "mean_norm/layer4": 9.489933848381042, + "mean_norm/layer5": 11.182459115982056, + "mean_norm/layer6": 9.141457200050354, + "mean_norm/layer7": 9.522015750408173, + "mean_norm/layer8": 9.876333832740784, + "mean_norm/layer9": 9.827938497066498, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 6300 + }, + { + "epoch": 2.63, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46196809481510326, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.738924503326416, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.9635, + "eval_samples_per_second": 20.145, + "eval_steps_per_second": 0.669, + "step": 6300 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.65, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6893, + "max_norm": 25.860660552978516, + "max_norm/layer0": 20.153108596801758, + "max_norm/layer1": 21.598623275756836, + "max_norm/layer10": 22.939794540405273, + "max_norm/layer11": 21.61341094970703, + "max_norm/layer12": 23.165863037109375, + "max_norm/layer13": 20.091089248657227, + "max_norm/layer14": 21.64145278930664, + "max_norm/layer15": 25.02685546875, + "max_norm/layer16": 21.53008460998535, + "max_norm/layer17": 24.88070297241211, + "max_norm/layer18": 21.985137939453125, + "max_norm/layer19": 21.748992919921875, + "max_norm/layer2": 17.670303344726562, + "max_norm/layer20": 22.993227005004883, + "max_norm/layer21": 22.341312408447266, + "max_norm/layer22": 23.091922760009766, + "max_norm/layer23": 22.425304412841797, + "max_norm/layer3": 20.88212776184082, + "max_norm/layer4": 20.852691650390625, + "max_norm/layer5": 25.860660552978516, + "max_norm/layer6": 18.694791793823242, + "max_norm/layer7": 22.36998748779297, + "max_norm/layer8": 22.611835479736328, + "max_norm/layer9": 22.073123931884766, + "mean_norm": 10.021994044383367, + "mean_norm/layer0": 9.548484921455383, + "mean_norm/layer1": 9.568365037441254, + "mean_norm/layer10": 9.912571847438812, + "mean_norm/layer11": 10.139825105667114, + "mean_norm/layer12": 10.495871722698212, + "mean_norm/layer13": 9.878227055072784, + "mean_norm/layer14": 10.189821481704712, + "mean_norm/layer15": 10.416566729545593, + "mean_norm/layer16": 9.962967872619629, + "mean_norm/layer17": 10.359967112541199, + "mean_norm/layer18": 10.028738617897034, + "mean_norm/layer19": 10.05587649345398, + "mean_norm/layer2": 8.637226641178131, + "mean_norm/layer20": 10.160935282707214, + "mean_norm/layer21": 10.114270150661469, + "mean_norm/layer22": 10.844156503677368, + "mean_norm/layer23": 10.797121524810791, + "mean_norm/layer3": 10.316659390926361, + "mean_norm/layer4": 9.497858464717865, + "mean_norm/layer5": 11.200486063957214, + "mean_norm/layer6": 9.147541284561157, + "mean_norm/layer7": 9.530200600624084, + "mean_norm/layer8": 9.886442244052887, + "mean_norm/layer9": 9.837674915790558, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 6350 + }, + { + "epoch": 2.65, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4616557760715169, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.738407850265503, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.894, + "eval_samples_per_second": 20.262, + "eval_steps_per_second": 0.673, + "step": 6350 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.67, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6801, + "max_norm": 25.973201751708984, + "max_norm/layer0": 20.24967384338379, + "max_norm/layer1": 21.692955017089844, + "max_norm/layer10": 23.032072067260742, + "max_norm/layer11": 21.712499618530273, + "max_norm/layer12": 23.234333038330078, + "max_norm/layer13": 20.183149337768555, + "max_norm/layer14": 21.744234085083008, + "max_norm/layer15": 25.175216674804688, + "max_norm/layer16": 21.600980758666992, + "max_norm/layer17": 25.01777458190918, + "max_norm/layer18": 22.099838256835938, + "max_norm/layer19": 21.83799171447754, + "max_norm/layer2": 17.750036239624023, + "max_norm/layer20": 23.09636688232422, + "max_norm/layer21": 22.446022033691406, + "max_norm/layer22": 23.194242477416992, + "max_norm/layer23": 22.509754180908203, + "max_norm/layer3": 20.972686767578125, + "max_norm/layer4": 20.944406509399414, + "max_norm/layer5": 25.973201751708984, + "max_norm/layer6": 18.7388858795166, + "max_norm/layer7": 22.43354606628418, + "max_norm/layer8": 22.72319221496582, + "max_norm/layer9": 22.152870178222656, + "mean_norm": 10.033037247757116, + "mean_norm/layer0": 9.559500932693481, + "mean_norm/layer1": 9.57817429304123, + "mean_norm/layer10": 9.92283582687378, + "mean_norm/layer11": 10.151250958442688, + "mean_norm/layer12": 10.510083556175232, + "mean_norm/layer13": 9.888749897480011, + "mean_norm/layer14": 10.201764583587646, + "mean_norm/layer15": 10.429744482040405, + "mean_norm/layer16": 9.973683893680573, + "mean_norm/layer17": 10.372322142124176, + "mean_norm/layer18": 10.039182603359222, + "mean_norm/layer19": 10.066715955734253, + "mean_norm/layer2": 8.640654444694519, + "mean_norm/layer20": 10.171599209308624, + "mean_norm/layer21": 10.125025808811188, + "mean_norm/layer22": 10.859051883220673, + "mean_norm/layer23": 10.811841130256653, + "mean_norm/layer3": 10.329941034317017, + "mean_norm/layer4": 9.505902767181396, + "mean_norm/layer5": 11.218784868717194, + "mean_norm/layer6": 9.153590142726898, + "mean_norm/layer7": 9.538390636444092, + "mean_norm/layer8": 9.896606981754303, + "mean_norm/layer9": 9.847495913505554, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 6400 + }, + { + "epoch": 2.67, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.462511610550695, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.732863664627075, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8118, + "eval_samples_per_second": 20.403, + "eval_steps_per_second": 0.677, + "step": 6400 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.69, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6817, + "max_norm": 26.08163070678711, + "max_norm/layer0": 20.342599868774414, + "max_norm/layer1": 21.786935806274414, + "max_norm/layer10": 23.1118106842041, + "max_norm/layer11": 21.78784942626953, + "max_norm/layer12": 23.314739227294922, + "max_norm/layer13": 20.244739532470703, + "max_norm/layer14": 21.830318450927734, + "max_norm/layer15": 25.3209228515625, + "max_norm/layer16": 21.691482543945312, + "max_norm/layer17": 25.14759063720703, + "max_norm/layer18": 22.2069034576416, + "max_norm/layer19": 21.922334671020508, + "max_norm/layer2": 17.808311462402344, + "max_norm/layer20": 23.185317993164062, + "max_norm/layer21": 22.515777587890625, + "max_norm/layer22": 23.288124084472656, + "max_norm/layer23": 22.597469329833984, + "max_norm/layer3": 21.05324363708496, + "max_norm/layer4": 21.01177215576172, + "max_norm/layer5": 26.08163070678711, + "max_norm/layer6": 18.78575325012207, + "max_norm/layer7": 22.506237030029297, + "max_norm/layer8": 22.81680679321289, + "max_norm/layer9": 22.22559928894043, + "mean_norm": 10.043887262543043, + "mean_norm/layer0": 9.570309102535248, + "mean_norm/layer1": 9.587825655937195, + "mean_norm/layer10": 9.932947993278503, + "mean_norm/layer11": 10.162622213363647, + "mean_norm/layer12": 10.524069786071777, + "mean_norm/layer13": 9.899032413959503, + "mean_norm/layer14": 10.213397681713104, + "mean_norm/layer15": 10.44272756576538, + "mean_norm/layer16": 9.984095215797424, + "mean_norm/layer17": 10.38427847623825, + "mean_norm/layer18": 10.049458801746368, + "mean_norm/layer19": 10.07730907201767, + "mean_norm/layer2": 8.64402985572815, + "mean_norm/layer20": 10.182213187217712, + "mean_norm/layer21": 10.135670959949493, + "mean_norm/layer22": 10.873790740966797, + "mean_norm/layer23": 10.826238214969635, + "mean_norm/layer3": 10.342928886413574, + "mean_norm/layer4": 9.513796925544739, + "mean_norm/layer5": 11.236631333827972, + "mean_norm/layer6": 9.159627318382263, + "mean_norm/layer7": 9.546464681625366, + "mean_norm/layer8": 9.906689047813416, + "mean_norm/layer9": 9.85713917016983, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 6450 + }, + { + "epoch": 2.69, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4634282863435587, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7291603088378906, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 10.9312, + "eval_samples_per_second": 22.047, + "eval_steps_per_second": 0.732, + "step": 6450 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.71, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6874, + "max_norm": 26.185462951660156, + "max_norm/layer0": 20.429880142211914, + "max_norm/layer1": 21.891557693481445, + "max_norm/layer10": 23.196739196777344, + "max_norm/layer11": 21.859304428100586, + "max_norm/layer12": 23.41972541809082, + "max_norm/layer13": 20.317655563354492, + "max_norm/layer14": 21.93121337890625, + "max_norm/layer15": 25.443115234375, + "max_norm/layer16": 21.796695709228516, + "max_norm/layer17": 25.274187088012695, + "max_norm/layer18": 22.326488494873047, + "max_norm/layer19": 22.01841163635254, + "max_norm/layer2": 17.86547088623047, + "max_norm/layer20": 23.280214309692383, + "max_norm/layer21": 22.618255615234375, + "max_norm/layer22": 23.38398551940918, + "max_norm/layer23": 22.68142318725586, + "max_norm/layer3": 21.130823135375977, + "max_norm/layer4": 21.080659866333008, + "max_norm/layer5": 26.185462951660156, + "max_norm/layer6": 18.8240909576416, + "max_norm/layer7": 22.595474243164062, + "max_norm/layer8": 22.909751892089844, + "max_norm/layer9": 22.31151008605957, + "mean_norm": 10.054706205924353, + "mean_norm/layer0": 9.581124305725098, + "mean_norm/layer1": 9.597380995750427, + "mean_norm/layer10": 9.9429412484169, + "mean_norm/layer11": 10.173977673053741, + "mean_norm/layer12": 10.537902593612671, + "mean_norm/layer13": 9.909233927726746, + "mean_norm/layer14": 10.225030422210693, + "mean_norm/layer15": 10.455805003643036, + "mean_norm/layer16": 9.994404911994934, + "mean_norm/layer17": 10.396243751049042, + "mean_norm/layer18": 10.059688329696655, + "mean_norm/layer19": 10.08789175748825, + "mean_norm/layer2": 8.647391676902771, + "mean_norm/layer20": 10.192969799041748, + "mean_norm/layer21": 10.14613652229309, + "mean_norm/layer22": 10.88859474658966, + "mean_norm/layer23": 10.8405082821846, + "mean_norm/layer3": 10.355776727199554, + "mean_norm/layer4": 9.52163827419281, + "mean_norm/layer5": 11.25450748205185, + "mean_norm/layer6": 9.165621161460876, + "mean_norm/layer7": 9.554507315158844, + "mean_norm/layer8": 9.916891932487488, + "mean_norm/layer9": 9.86678010225296, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 6500 + }, + { + "epoch": 2.71, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4635580811460881, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.728681802749634, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.9589, + "eval_samples_per_second": 20.152, + "eval_steps_per_second": 0.669, + "step": 6500 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.73, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.679, + "max_norm": 26.300392150878906, + "max_norm/layer0": 20.514989852905273, + "max_norm/layer1": 21.97933006286621, + "max_norm/layer10": 23.27261734008789, + "max_norm/layer11": 21.926321029663086, + "max_norm/layer12": 23.4990291595459, + "max_norm/layer13": 20.39130210876465, + "max_norm/layer14": 22.02625274658203, + "max_norm/layer15": 25.556787490844727, + "max_norm/layer16": 21.871458053588867, + "max_norm/layer17": 25.401857376098633, + "max_norm/layer18": 22.435489654541016, + "max_norm/layer19": 22.1010684967041, + "max_norm/layer2": 17.91828727722168, + "max_norm/layer20": 23.372716903686523, + "max_norm/layer21": 22.709657669067383, + "max_norm/layer22": 23.478649139404297, + "max_norm/layer23": 22.77086067199707, + "max_norm/layer3": 21.2097110748291, + "max_norm/layer4": 21.154205322265625, + "max_norm/layer5": 26.300392150878906, + "max_norm/layer6": 18.872074127197266, + "max_norm/layer7": 22.68345832824707, + "max_norm/layer8": 23.019010543823242, + "max_norm/layer9": 22.39520263671875, + "mean_norm": 10.065300052364668, + "mean_norm/layer0": 9.591688811779022, + "mean_norm/layer1": 9.60675710439682, + "mean_norm/layer10": 9.95275890827179, + "mean_norm/layer11": 10.185077250003815, + "mean_norm/layer12": 10.55156809091568, + "mean_norm/layer13": 9.919322490692139, + "mean_norm/layer14": 10.236485064029694, + "mean_norm/layer15": 10.468361973762512, + "mean_norm/layer16": 10.004529654979706, + "mean_norm/layer17": 10.407990336418152, + "mean_norm/layer18": 10.069653689861298, + "mean_norm/layer19": 10.098095178604126, + "mean_norm/layer2": 8.650662422180176, + "mean_norm/layer20": 10.203266143798828, + "mean_norm/layer21": 10.156417906284332, + "mean_norm/layer22": 10.903109967708588, + "mean_norm/layer23": 10.854621052742004, + "mean_norm/layer3": 10.368398368358612, + "mean_norm/layer4": 9.529488384723663, + "mean_norm/layer5": 11.272061467170715, + "mean_norm/layer6": 9.17146784067154, + "mean_norm/layer7": 9.562333583831787, + "mean_norm/layer8": 9.926826179027557, + "mean_norm/layer9": 9.87625938653946, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 6550 + }, + { + "epoch": 2.73, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46354591288335095, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7235679626464844, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.9943, + "eval_samples_per_second": 20.093, + "eval_steps_per_second": 0.667, + "step": 6550 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.76, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6811, + "max_norm": 26.41242790222168, + "max_norm/layer0": 20.60313606262207, + "max_norm/layer1": 22.07373046875, + "max_norm/layer10": 23.349884033203125, + "max_norm/layer11": 21.98993682861328, + "max_norm/layer12": 23.584455490112305, + "max_norm/layer13": 20.48732566833496, + "max_norm/layer14": 22.116924285888672, + "max_norm/layer15": 25.71857261657715, + "max_norm/layer16": 21.94927978515625, + "max_norm/layer17": 25.516101837158203, + "max_norm/layer18": 22.543033599853516, + "max_norm/layer19": 22.182836532592773, + "max_norm/layer2": 17.969606399536133, + "max_norm/layer20": 23.472898483276367, + "max_norm/layer21": 22.797204971313477, + "max_norm/layer22": 23.56959342956543, + "max_norm/layer23": 22.859933853149414, + "max_norm/layer3": 21.289579391479492, + "max_norm/layer4": 21.220144271850586, + "max_norm/layer5": 26.41242790222168, + "max_norm/layer6": 18.920167922973633, + "max_norm/layer7": 22.76586151123047, + "max_norm/layer8": 23.115718841552734, + "max_norm/layer9": 22.4892635345459, + "mean_norm": 10.076057064036528, + "mean_norm/layer0": 9.602395057678223, + "mean_norm/layer1": 9.616295576095581, + "mean_norm/layer10": 9.962799191474915, + "mean_norm/layer11": 10.196372210979462, + "mean_norm/layer12": 10.565538883209229, + "mean_norm/layer13": 9.929556131362915, + "mean_norm/layer14": 10.248076438903809, + "mean_norm/layer15": 10.481202960014343, + "mean_norm/layer16": 10.014976143836975, + "mean_norm/layer17": 10.419837892055511, + "mean_norm/layer18": 10.079734206199646, + "mean_norm/layer19": 10.108431100845337, + "mean_norm/layer2": 8.654021739959717, + "mean_norm/layer20": 10.213871002197266, + "mean_norm/layer21": 10.167028248310089, + "mean_norm/layer22": 10.917715430259705, + "mean_norm/layer23": 10.86873722076416, + "mean_norm/layer3": 10.381210148334503, + "mean_norm/layer4": 9.537363827228546, + "mean_norm/layer5": 11.289835691452026, + "mean_norm/layer6": 9.177374601364136, + "mean_norm/layer7": 9.570362865924835, + "mean_norm/layer8": 9.93681263923645, + "mean_norm/layer9": 9.8858203291893, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 6600 + }, + { + "epoch": 2.76, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4633228280665036, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7256357669830322, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 10.9601, + "eval_samples_per_second": 21.989, + "eval_steps_per_second": 0.73, + "step": 6600 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.78, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6643, + "max_norm": 26.53062629699707, + "max_norm/layer0": 20.69165802001953, + "max_norm/layer1": 22.169431686401367, + "max_norm/layer10": 23.433088302612305, + "max_norm/layer11": 22.052358627319336, + "max_norm/layer12": 23.695178985595703, + "max_norm/layer13": 20.58042335510254, + "max_norm/layer14": 22.196151733398438, + "max_norm/layer15": 25.866147994995117, + "max_norm/layer16": 22.042850494384766, + "max_norm/layer17": 25.626388549804688, + "max_norm/layer18": 22.655969619750977, + "max_norm/layer19": 22.26487159729004, + "max_norm/layer2": 18.044330596923828, + "max_norm/layer20": 23.553281784057617, + "max_norm/layer21": 22.87949562072754, + "max_norm/layer22": 23.65622901916504, + "max_norm/layer23": 22.95343589782715, + "max_norm/layer3": 21.365331649780273, + "max_norm/layer4": 21.279878616333008, + "max_norm/layer5": 26.53062629699707, + "max_norm/layer6": 18.96720314025879, + "max_norm/layer7": 22.85620880126953, + "max_norm/layer8": 23.207963943481445, + "max_norm/layer9": 22.580841064453125, + "mean_norm": 10.086789600551128, + "mean_norm/layer0": 9.613000214099884, + "mean_norm/layer1": 9.625762045383453, + "mean_norm/layer10": 9.97273999452591, + "mean_norm/layer11": 10.207618951797485, + "mean_norm/layer12": 10.579367339611053, + "mean_norm/layer13": 9.939832985401154, + "mean_norm/layer14": 10.259712278842926, + "mean_norm/layer15": 10.494081377983093, + "mean_norm/layer16": 10.025314569473267, + "mean_norm/layer17": 10.431630611419678, + "mean_norm/layer18": 10.089784562587738, + "mean_norm/layer19": 10.11875718832016, + "mean_norm/layer2": 8.65731281042099, + "mean_norm/layer20": 10.224305629730225, + "mean_norm/layer21": 10.177746534347534, + "mean_norm/layer22": 10.93244206905365, + "mean_norm/layer23": 10.883185744285583, + "mean_norm/layer3": 10.393769443035126, + "mean_norm/layer4": 9.54505968093872, + "mean_norm/layer5": 11.307492792606354, + "mean_norm/layer6": 9.183353424072266, + "mean_norm/layer7": 9.578372538089752, + "mean_norm/layer8": 9.946847558021545, + "mean_norm/layer9": 9.895460069179535, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 6650 + }, + { + "epoch": 2.78, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.464113765144417, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7235653400421143, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 10.9913, + "eval_samples_per_second": 21.927, + "eval_steps_per_second": 0.728, + "step": 6650 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.8, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6876, + "max_norm": 26.64914894104004, + "max_norm/layer0": 20.784852981567383, + "max_norm/layer1": 22.261592864990234, + "max_norm/layer10": 23.51398277282715, + "max_norm/layer11": 22.147192001342773, + "max_norm/layer12": 23.818450927734375, + "max_norm/layer13": 20.655099868774414, + "max_norm/layer14": 22.267887115478516, + "max_norm/layer15": 25.970462799072266, + "max_norm/layer16": 22.135021209716797, + "max_norm/layer17": 25.742647171020508, + "max_norm/layer18": 22.75875473022461, + "max_norm/layer19": 22.36121368408203, + "max_norm/layer2": 18.096092224121094, + "max_norm/layer20": 23.627822875976562, + "max_norm/layer21": 22.97427749633789, + "max_norm/layer22": 23.749114990234375, + "max_norm/layer23": 23.046504974365234, + "max_norm/layer3": 21.45503044128418, + "max_norm/layer4": 21.35271453857422, + "max_norm/layer5": 26.64914894104004, + "max_norm/layer6": 19.017742156982422, + "max_norm/layer7": 22.955495834350586, + "max_norm/layer8": 23.273195266723633, + "max_norm/layer9": 22.669376373291016, + "mean_norm": 10.09744872401158, + "mean_norm/layer0": 9.623487830162048, + "mean_norm/layer1": 9.635239779949188, + "mean_norm/layer10": 9.982640266418457, + "mean_norm/layer11": 10.218821167945862, + "mean_norm/layer12": 10.593107223510742, + "mean_norm/layer13": 9.950129866600037, + "mean_norm/layer14": 10.271190285682678, + "mean_norm/layer15": 10.50691831111908, + "mean_norm/layer16": 10.035589933395386, + "mean_norm/layer17": 10.443416774272919, + "mean_norm/layer18": 10.099798321723938, + "mean_norm/layer19": 10.12911069393158, + "mean_norm/layer2": 8.660598039627075, + "mean_norm/layer20": 10.234609246253967, + "mean_norm/layer21": 10.188297629356384, + "mean_norm/layer22": 10.946758568286896, + "mean_norm/layer23": 10.897278547286987, + "mean_norm/layer3": 10.406484246253967, + "mean_norm/layer4": 9.55282211303711, + "mean_norm/layer5": 11.324999570846558, + "mean_norm/layer6": 9.18930995464325, + "mean_norm/layer7": 9.58632493019104, + "mean_norm/layer8": 9.956737279891968, + "mean_norm/layer9": 9.905098795890808, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 6700 + }, + { + "epoch": 2.8, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4638582316269373, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7227768898010254, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.9561, + "eval_samples_per_second": 20.157, + "eval_steps_per_second": 0.669, + "step": 6700 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.82, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6642, + "max_norm": 26.773120880126953, + "max_norm/layer0": 20.875125885009766, + "max_norm/layer1": 22.349252700805664, + "max_norm/layer10": 23.591472625732422, + "max_norm/layer11": 22.24338150024414, + "max_norm/layer12": 23.943801879882812, + "max_norm/layer13": 20.728654861450195, + "max_norm/layer14": 22.363893508911133, + "max_norm/layer15": 26.09659194946289, + "max_norm/layer16": 22.210033416748047, + "max_norm/layer17": 25.849321365356445, + "max_norm/layer18": 22.857954025268555, + "max_norm/layer19": 22.457433700561523, + "max_norm/layer2": 18.137813568115234, + "max_norm/layer20": 23.715415954589844, + "max_norm/layer21": 23.066875457763672, + "max_norm/layer22": 23.838668823242188, + "max_norm/layer23": 23.13340950012207, + "max_norm/layer3": 21.559398651123047, + "max_norm/layer4": 21.422008514404297, + "max_norm/layer5": 26.773120880126953, + "max_norm/layer6": 19.059314727783203, + "max_norm/layer7": 23.055139541625977, + "max_norm/layer8": 23.34084701538086, + "max_norm/layer9": 22.744380950927734, + "mean_norm": 10.108140423893929, + "mean_norm/layer0": 9.634041845798492, + "mean_norm/layer1": 9.64472496509552, + "mean_norm/layer10": 9.992616534233093, + "mean_norm/layer11": 10.230005323886871, + "mean_norm/layer12": 10.606897294521332, + "mean_norm/layer13": 9.960363149642944, + "mean_norm/layer14": 10.282639801502228, + "mean_norm/layer15": 10.519710779190063, + "mean_norm/layer16": 10.045837819576263, + "mean_norm/layer17": 10.455260336399078, + "mean_norm/layer18": 10.109922409057617, + "mean_norm/layer19": 10.13957166671753, + "mean_norm/layer2": 8.663931012153625, + "mean_norm/layer20": 10.244955360889435, + "mean_norm/layer21": 10.198612809181213, + "mean_norm/layer22": 10.961101591587067, + "mean_norm/layer23": 10.911440670490265, + "mean_norm/layer3": 10.419304966926575, + "mean_norm/layer4": 9.560689806938171, + "mean_norm/layer5": 11.342604517936707, + "mean_norm/layer6": 9.19537079334259, + "mean_norm/layer7": 9.594294905662537, + "mean_norm/layer8": 9.96668291091919, + "mean_norm/layer9": 9.914788901805878, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 6750 + }, + { + "epoch": 2.82, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46477896350738007, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.719167470932007, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.9754, + "eval_samples_per_second": 20.125, + "eval_steps_per_second": 0.668, + "step": 6750 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.84, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6727, + "max_norm": 26.90037727355957, + "max_norm/layer0": 20.969045639038086, + "max_norm/layer1": 22.430818557739258, + "max_norm/layer10": 23.685087203979492, + "max_norm/layer11": 22.313629150390625, + "max_norm/layer12": 24.071069717407227, + "max_norm/layer13": 20.809654235839844, + "max_norm/layer14": 22.459442138671875, + "max_norm/layer15": 26.201696395874023, + "max_norm/layer16": 22.303298950195312, + "max_norm/layer17": 25.975738525390625, + "max_norm/layer18": 22.961307525634766, + "max_norm/layer19": 22.554285049438477, + "max_norm/layer2": 18.194622039794922, + "max_norm/layer20": 23.812129974365234, + "max_norm/layer21": 23.155019760131836, + "max_norm/layer22": 23.927391052246094, + "max_norm/layer23": 23.213560104370117, + "max_norm/layer3": 21.650287628173828, + "max_norm/layer4": 21.503629684448242, + "max_norm/layer5": 26.90037727355957, + "max_norm/layer6": 19.09876251220703, + "max_norm/layer7": 23.141084671020508, + "max_norm/layer8": 23.412324905395508, + "max_norm/layer9": 22.814966201782227, + "mean_norm": 10.118629676600298, + "mean_norm/layer0": 9.644381642341614, + "mean_norm/layer1": 9.654210925102234, + "mean_norm/layer10": 10.002406060695648, + "mean_norm/layer11": 10.240853428840637, + "mean_norm/layer12": 10.620422959327698, + "mean_norm/layer13": 9.970386505126953, + "mean_norm/layer14": 10.293885469436646, + "mean_norm/layer15": 10.53236836194992, + "mean_norm/layer16": 10.055989801883698, + "mean_norm/layer17": 10.4669588804245, + "mean_norm/layer18": 10.119860827922821, + "mean_norm/layer19": 10.14971262216568, + "mean_norm/layer2": 8.667130768299103, + "mean_norm/layer20": 10.255202949047089, + "mean_norm/layer21": 10.208835124969482, + "mean_norm/layer22": 10.975344359874725, + "mean_norm/layer23": 10.925430059432983, + "mean_norm/layer3": 10.431658208370209, + "mean_norm/layer4": 9.568336188793182, + "mean_norm/layer5": 11.35985416173935, + "mean_norm/layer6": 9.201176106929779, + "mean_norm/layer7": 9.60221016407013, + "mean_norm/layer8": 9.976355135440826, + "mean_norm/layer9": 9.924141526222229, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 6800 + }, + { + "epoch": 2.84, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46521296487833763, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7178404331207275, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 12.0017, + "eval_samples_per_second": 20.08, + "eval_steps_per_second": 0.667, + "step": 6800 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.86, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6807, + "max_norm": 27.022308349609375, + "max_norm/layer0": 21.06038475036621, + "max_norm/layer1": 22.520341873168945, + "max_norm/layer10": 23.770435333251953, + "max_norm/layer11": 22.414648056030273, + "max_norm/layer12": 24.182048797607422, + "max_norm/layer13": 20.879291534423828, + "max_norm/layer14": 22.538923263549805, + "max_norm/layer15": 26.301652908325195, + "max_norm/layer16": 22.408843994140625, + "max_norm/layer17": 26.084640502929688, + "max_norm/layer18": 23.061779022216797, + "max_norm/layer19": 22.65226936340332, + "max_norm/layer2": 18.260866165161133, + "max_norm/layer20": 23.915470123291016, + "max_norm/layer21": 23.253692626953125, + "max_norm/layer22": 24.023237228393555, + "max_norm/layer23": 23.293275833129883, + "max_norm/layer3": 21.75033187866211, + "max_norm/layer4": 21.58634376525879, + "max_norm/layer5": 27.022308349609375, + "max_norm/layer6": 19.1436824798584, + "max_norm/layer7": 23.238664627075195, + "max_norm/layer8": 23.49786949157715, + "max_norm/layer9": 22.880979537963867, + "mean_norm": 10.129067420959473, + "mean_norm/layer0": 9.65470838546753, + "mean_norm/layer1": 9.663567900657654, + "mean_norm/layer10": 10.012172758579254, + "mean_norm/layer11": 10.251695156097412, + "mean_norm/layer12": 10.633814513683319, + "mean_norm/layer13": 9.980302691459656, + "mean_norm/layer14": 10.304986953735352, + "mean_norm/layer15": 10.544901430606842, + "mean_norm/layer16": 10.066105425357819, + "mean_norm/layer17": 10.478527903556824, + "mean_norm/layer18": 10.129638016223907, + "mean_norm/layer19": 10.159819066524506, + "mean_norm/layer2": 8.67033064365387, + "mean_norm/layer20": 10.265411257743835, + "mean_norm/layer21": 10.219161748886108, + "mean_norm/layer22": 10.989376246929169, + "mean_norm/layer23": 10.939277946949005, + "mean_norm/layer3": 10.444223880767822, + "mean_norm/layer4": 9.575941681861877, + "mean_norm/layer5": 11.377063035964966, + "mean_norm/layer6": 9.207095921039581, + "mean_norm/layer7": 9.61001867055893, + "mean_norm/layer8": 9.98603469133377, + "mean_norm/layer9": 9.933442175388336, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 6850 + }, + { + "epoch": 2.86, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46436524257431766, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7178053855895996, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 12.0365, + "eval_samples_per_second": 20.022, + "eval_steps_per_second": 0.665, + "step": 6850 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.88, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6681, + "max_norm": 27.13735580444336, + "max_norm/layer0": 21.155269622802734, + "max_norm/layer1": 22.60647964477539, + "max_norm/layer10": 23.85950469970703, + "max_norm/layer11": 22.502986907958984, + "max_norm/layer12": 24.27869415283203, + "max_norm/layer13": 20.957544326782227, + "max_norm/layer14": 22.631610870361328, + "max_norm/layer15": 26.41908836364746, + "max_norm/layer16": 22.488388061523438, + "max_norm/layer17": 26.20008659362793, + "max_norm/layer18": 23.15396499633789, + "max_norm/layer19": 22.744834899902344, + "max_norm/layer2": 18.32578468322754, + "max_norm/layer20": 24.02092933654785, + "max_norm/layer21": 23.352216720581055, + "max_norm/layer22": 24.124401092529297, + "max_norm/layer23": 23.385162353515625, + "max_norm/layer3": 21.84356117248535, + "max_norm/layer4": 21.661521911621094, + "max_norm/layer5": 27.13735580444336, + "max_norm/layer6": 19.194093704223633, + "max_norm/layer7": 23.325639724731445, + "max_norm/layer8": 23.56928253173828, + "max_norm/layer9": 22.95269203186035, + "mean_norm": 10.139540493488312, + "mean_norm/layer0": 9.665144145488739, + "mean_norm/layer1": 9.672926366329193, + "mean_norm/layer10": 10.022092461585999, + "mean_norm/layer11": 10.262580275535583, + "mean_norm/layer12": 10.647343635559082, + "mean_norm/layer13": 9.990399658679962, + "mean_norm/layer14": 10.316211938858032, + "mean_norm/layer15": 10.557567954063416, + "mean_norm/layer16": 10.07616525888443, + "mean_norm/layer17": 10.490152776241302, + "mean_norm/layer18": 10.139376282691956, + "mean_norm/layer19": 10.169822752475739, + "mean_norm/layer2": 8.673572421073914, + "mean_norm/layer20": 10.275636315345764, + "mean_norm/layer21": 10.229391396045685, + "mean_norm/layer22": 11.003340423107147, + "mean_norm/layer23": 10.952987730503082, + "mean_norm/layer3": 10.456810116767883, + "mean_norm/layer4": 9.58361804485321, + "mean_norm/layer5": 11.394310891628265, + "mean_norm/layer6": 9.212887942790985, + "mean_norm/layer7": 9.617939710617065, + "mean_norm/layer8": 9.995769262313843, + "mean_norm/layer9": 9.942924082279205, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 6900 + }, + { + "epoch": 2.88, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46391096076546484, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7232961654663086, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.9728, + "eval_samples_per_second": 20.129, + "eval_steps_per_second": 0.668, + "step": 6900 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.9, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.683, + "max_norm": 27.246826171875, + "max_norm/layer0": 21.23979949951172, + "max_norm/layer1": 22.690458297729492, + "max_norm/layer10": 23.941022872924805, + "max_norm/layer11": 22.600021362304688, + "max_norm/layer12": 24.37978744506836, + "max_norm/layer13": 21.041887283325195, + "max_norm/layer14": 22.723411560058594, + "max_norm/layer15": 26.524131774902344, + "max_norm/layer16": 22.572383880615234, + "max_norm/layer17": 26.303722381591797, + "max_norm/layer18": 23.273639678955078, + "max_norm/layer19": 22.84536361694336, + "max_norm/layer2": 18.371814727783203, + "max_norm/layer20": 24.109756469726562, + "max_norm/layer21": 23.438453674316406, + "max_norm/layer22": 24.226545333862305, + "max_norm/layer23": 23.486717224121094, + "max_norm/layer3": 21.92794418334961, + "max_norm/layer4": 21.739208221435547, + "max_norm/layer5": 27.246826171875, + "max_norm/layer6": 19.241615295410156, + "max_norm/layer7": 23.398082733154297, + "max_norm/layer8": 23.666467666625977, + "max_norm/layer9": 23.0317325592041, + "mean_norm": 10.149980219701925, + "mean_norm/layer0": 9.675594747066498, + "mean_norm/layer1": 9.682190597057343, + "mean_norm/layer10": 10.031827569007874, + "mean_norm/layer11": 10.273438334465027, + "mean_norm/layer12": 10.660808444023132, + "mean_norm/layer13": 10.000330448150635, + "mean_norm/layer14": 10.327272832393646, + "mean_norm/layer15": 10.57010704278946, + "mean_norm/layer16": 10.08619076013565, + "mean_norm/layer17": 10.501644492149353, + "mean_norm/layer18": 10.1490837931633, + "mean_norm/layer19": 10.179917216300964, + "mean_norm/layer2": 8.676787793636322, + "mean_norm/layer20": 10.285813570022583, + "mean_norm/layer21": 10.239711225032806, + "mean_norm/layer22": 11.01748389005661, + "mean_norm/layer23": 10.966828763484955, + "mean_norm/layer3": 10.469435572624207, + "mean_norm/layer4": 9.591278553009033, + "mean_norm/layer5": 11.41142475605011, + "mean_norm/layer6": 9.218688607215881, + "mean_norm/layer7": 9.625806748867035, + "mean_norm/layer8": 10.005479514598846, + "mean_norm/layer9": 9.952380001544952, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 6950 + }, + { + "epoch": 2.9, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46421111124631403, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7184746265411377, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.9605, + "eval_samples_per_second": 20.15, + "eval_steps_per_second": 0.669, + "step": 6950 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.92, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6739, + "max_norm": 27.365013122558594, + "max_norm/layer0": 21.320209503173828, + "max_norm/layer1": 22.772533416748047, + "max_norm/layer10": 24.037193298339844, + "max_norm/layer11": 22.68212890625, + "max_norm/layer12": 24.47044563293457, + "max_norm/layer13": 21.140518188476562, + "max_norm/layer14": 22.791292190551758, + "max_norm/layer15": 26.62784194946289, + "max_norm/layer16": 22.64996910095215, + "max_norm/layer17": 26.407562255859375, + "max_norm/layer18": 23.370203018188477, + "max_norm/layer19": 22.947025299072266, + "max_norm/layer2": 18.42116355895996, + "max_norm/layer20": 24.20484733581543, + "max_norm/layer21": 23.53941535949707, + "max_norm/layer22": 24.325706481933594, + "max_norm/layer23": 23.589479446411133, + "max_norm/layer3": 21.999433517456055, + "max_norm/layer4": 21.819570541381836, + "max_norm/layer5": 27.365013122558594, + "max_norm/layer6": 19.291427612304688, + "max_norm/layer7": 23.481708526611328, + "max_norm/layer8": 23.764585494995117, + "max_norm/layer9": 23.106569290161133, + "mean_norm": 10.160274868210157, + "mean_norm/layer0": 9.685955584049225, + "mean_norm/layer1": 9.691339433193207, + "mean_norm/layer10": 10.041491627693176, + "mean_norm/layer11": 10.284164071083069, + "mean_norm/layer12": 10.674180507659912, + "mean_norm/layer13": 10.010160326957703, + "mean_norm/layer14": 10.338261485099792, + "mean_norm/layer15": 10.582512021064758, + "mean_norm/layer16": 10.096154391765594, + "mean_norm/layer17": 10.513055503368378, + "mean_norm/layer18": 10.158551752567291, + "mean_norm/layer19": 10.189700782299042, + "mean_norm/layer2": 8.67995148897171, + "mean_norm/layer20": 10.295816540718079, + "mean_norm/layer21": 10.249844431877136, + "mean_norm/layer22": 11.031257331371307, + "mean_norm/layer23": 10.980518758296967, + "mean_norm/layer3": 10.481708467006683, + "mean_norm/layer4": 9.598879992961884, + "mean_norm/layer5": 11.428387343883514, + "mean_norm/layer6": 9.224398612976074, + "mean_norm/layer7": 9.633533835411072, + "mean_norm/layer8": 10.015078723430634, + "mean_norm/layer9": 9.961693823337555, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 7000 + }, + { + "epoch": 2.92, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4648519730838028, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.71905255317688, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 12.0164, + "eval_samples_per_second": 20.056, + "eval_steps_per_second": 0.666, + "step": 7000 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.94, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6601, + "max_norm": 27.486360549926758, + "max_norm/layer0": 21.405040740966797, + "max_norm/layer1": 22.844478607177734, + "max_norm/layer10": 24.13811683654785, + "max_norm/layer11": 22.76434326171875, + "max_norm/layer12": 24.57598304748535, + "max_norm/layer13": 21.21640396118164, + "max_norm/layer14": 22.89393424987793, + "max_norm/layer15": 26.729122161865234, + "max_norm/layer16": 22.737476348876953, + "max_norm/layer17": 26.515493392944336, + "max_norm/layer18": 23.493305206298828, + "max_norm/layer19": 23.048307418823242, + "max_norm/layer2": 18.475828170776367, + "max_norm/layer20": 24.307435989379883, + "max_norm/layer21": 23.62061882019043, + "max_norm/layer22": 24.448505401611328, + "max_norm/layer23": 23.68608856201172, + "max_norm/layer3": 22.074338912963867, + "max_norm/layer4": 21.888811111450195, + "max_norm/layer5": 27.486360549926758, + "max_norm/layer6": 19.338953018188477, + "max_norm/layer7": 23.5861759185791, + "max_norm/layer8": 23.85187530517578, + "max_norm/layer9": 23.19942855834961, + "mean_norm": 10.170738401512304, + "mean_norm/layer0": 9.69635421037674, + "mean_norm/layer1": 9.700594305992126, + "mean_norm/layer10": 10.051340162754059, + "mean_norm/layer11": 10.295095443725586, + "mean_norm/layer12": 10.687723755836487, + "mean_norm/layer13": 10.02021598815918, + "mean_norm/layer14": 10.349409282207489, + "mean_norm/layer15": 10.595264911651611, + "mean_norm/layer16": 10.106310904026031, + "mean_norm/layer17": 10.52473098039627, + "mean_norm/layer18": 10.168320178985596, + "mean_norm/layer19": 10.199616312980652, + "mean_norm/layer2": 8.683153092861176, + "mean_norm/layer20": 10.306044220924377, + "mean_norm/layer21": 10.260170817375183, + "mean_norm/layer22": 11.045268595218658, + "mean_norm/layer23": 10.994395852088928, + "mean_norm/layer3": 10.494205713272095, + "mean_norm/layer4": 9.606450021266937, + "mean_norm/layer5": 11.445621371269226, + "mean_norm/layer6": 9.230290651321411, + "mean_norm/layer7": 9.641353845596313, + "mean_norm/layer8": 10.02471512556076, + "mean_norm/layer9": 9.971075892448425, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 7050 + }, + { + "epoch": 2.94, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46439769127495, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7168571949005127, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8316, + "eval_samples_per_second": 20.369, + "eval_steps_per_second": 0.676, + "step": 7050 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.96, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.675, + "max_norm": 27.602540969848633, + "max_norm/layer0": 21.484041213989258, + "max_norm/layer1": 22.924697875976562, + "max_norm/layer10": 24.247194290161133, + "max_norm/layer11": 22.84771156311035, + "max_norm/layer12": 24.685514450073242, + "max_norm/layer13": 21.300878524780273, + "max_norm/layer14": 22.97532844543457, + "max_norm/layer15": 26.83058738708496, + "max_norm/layer16": 22.808544158935547, + "max_norm/layer17": 26.614301681518555, + "max_norm/layer18": 23.6390323638916, + "max_norm/layer19": 23.148977279663086, + "max_norm/layer2": 18.52928352355957, + "max_norm/layer20": 24.404052734375, + "max_norm/layer21": 23.719820022583008, + "max_norm/layer22": 24.551822662353516, + "max_norm/layer23": 23.78716468811035, + "max_norm/layer3": 22.14638900756836, + "max_norm/layer4": 21.958269119262695, + "max_norm/layer5": 27.602540969848633, + "max_norm/layer6": 19.384769439697266, + "max_norm/layer7": 23.659626007080078, + "max_norm/layer8": 23.928421020507812, + "max_norm/layer9": 23.31978416442871, + "mean_norm": 10.181060957411924, + "mean_norm/layer0": 9.706688940525055, + "mean_norm/layer1": 9.709847152233124, + "mean_norm/layer10": 10.061019718647003, + "mean_norm/layer11": 10.305987536907196, + "mean_norm/layer12": 10.701012432575226, + "mean_norm/layer13": 10.030164241790771, + "mean_norm/layer14": 10.360415279865265, + "mean_norm/layer15": 10.607886254787445, + "mean_norm/layer16": 10.116294264793396, + "mean_norm/layer17": 10.536153733730316, + "mean_norm/layer18": 10.177928388118744, + "mean_norm/layer19": 10.209418177604675, + "mean_norm/layer2": 8.686349153518677, + "mean_norm/layer20": 10.316045820713043, + "mean_norm/layer21": 10.270420730113983, + "mean_norm/layer22": 11.059071898460388, + "mean_norm/layer23": 11.008045971393585, + "mean_norm/layer3": 10.50650441646576, + "mean_norm/layer4": 9.613870918750763, + "mean_norm/layer5": 11.462700128555298, + "mean_norm/layer6": 9.236022472381592, + "mean_norm/layer7": 9.649041473865509, + "mean_norm/layer8": 10.034249007701874, + "mean_norm/layer9": 9.980324864387512, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 7100 + }, + { + "epoch": 2.96, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.465622629723821, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.714928388595581, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8305, + "eval_samples_per_second": 20.371, + "eval_steps_per_second": 0.676, + "step": 7100 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 2.99, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6726, + "max_norm": 27.709001541137695, + "max_norm/layer0": 21.556224822998047, + "max_norm/layer1": 23.0113525390625, + "max_norm/layer10": 24.326719284057617, + "max_norm/layer11": 22.943187713623047, + "max_norm/layer12": 24.772979736328125, + "max_norm/layer13": 21.37757110595703, + "max_norm/layer14": 23.051734924316406, + "max_norm/layer15": 26.927146911621094, + "max_norm/layer16": 22.884979248046875, + "max_norm/layer17": 26.728662490844727, + "max_norm/layer18": 23.741443634033203, + "max_norm/layer19": 23.258390426635742, + "max_norm/layer2": 18.579376220703125, + "max_norm/layer20": 24.51500701904297, + "max_norm/layer21": 23.80166244506836, + "max_norm/layer22": 24.64849281311035, + "max_norm/layer23": 23.88472557067871, + "max_norm/layer3": 22.230770111083984, + "max_norm/layer4": 22.012615203857422, + "max_norm/layer5": 27.709001541137695, + "max_norm/layer6": 19.437652587890625, + "max_norm/layer7": 23.738452911376953, + "max_norm/layer8": 23.992197036743164, + "max_norm/layer9": 23.42462158203125, + "mean_norm": 10.191307773192724, + "mean_norm/layer0": 9.716896176338196, + "mean_norm/layer1": 9.718885600566864, + "mean_norm/layer10": 10.07063364982605, + "mean_norm/layer11": 10.316668629646301, + "mean_norm/layer12": 10.714253962039948, + "mean_norm/layer13": 10.039902150630951, + "mean_norm/layer14": 10.371422827243805, + "mean_norm/layer15": 10.620187282562256, + "mean_norm/layer16": 10.126117765903473, + "mean_norm/layer17": 10.547522008419037, + "mean_norm/layer18": 10.187499582767487, + "mean_norm/layer19": 10.219323873519897, + "mean_norm/layer2": 8.689531564712524, + "mean_norm/layer20": 10.326024532318115, + "mean_norm/layer21": 10.280332446098328, + "mean_norm/layer22": 11.072968006134033, + "mean_norm/layer23": 11.021589159965515, + "mean_norm/layer3": 10.518806040287018, + "mean_norm/layer4": 9.621297419071198, + "mean_norm/layer5": 11.47957170009613, + "mean_norm/layer6": 9.241807997226715, + "mean_norm/layer7": 9.656856834888458, + "mean_norm/layer8": 10.043777287006378, + "mean_norm/layer9": 9.98951005935669, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 7150 + }, + { + "epoch": 2.99, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46464105652969256, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7129509449005127, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 10.9382, + "eval_samples_per_second": 22.033, + "eval_steps_per_second": 0.731, + "step": 7150 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.01, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.6093, + "max_norm": 27.824810028076172, + "max_norm/layer0": 21.625444412231445, + "max_norm/layer1": 23.094030380249023, + "max_norm/layer10": 24.410734176635742, + "max_norm/layer11": 23.041915893554688, + "max_norm/layer12": 24.885108947753906, + "max_norm/layer13": 21.451623916625977, + "max_norm/layer14": 23.14749526977539, + "max_norm/layer15": 27.040794372558594, + "max_norm/layer16": 22.965412139892578, + "max_norm/layer17": 26.842836380004883, + "max_norm/layer18": 23.85369300842285, + "max_norm/layer19": 23.35756492614746, + "max_norm/layer2": 18.625410079956055, + "max_norm/layer20": 24.62005043029785, + "max_norm/layer21": 23.91094207763672, + "max_norm/layer22": 24.742820739746094, + "max_norm/layer23": 23.971527099609375, + "max_norm/layer3": 22.325895309448242, + "max_norm/layer4": 22.078996658325195, + "max_norm/layer5": 27.824810028076172, + "max_norm/layer6": 19.494665145874023, + "max_norm/layer7": 23.832578659057617, + "max_norm/layer8": 24.08106803894043, + "max_norm/layer9": 23.532432556152344, + "mean_norm": 10.201683916151524, + "mean_norm/layer0": 9.727182745933533, + "mean_norm/layer1": 9.728063941001892, + "mean_norm/layer10": 10.080385386943817, + "mean_norm/layer11": 10.327516376972198, + "mean_norm/layer12": 10.727601408958435, + "mean_norm/layer13": 10.049872696399689, + "mean_norm/layer14": 10.382597625255585, + "mean_norm/layer15": 10.632773756980896, + "mean_norm/layer16": 10.136172950267792, + "mean_norm/layer17": 10.559046685695648, + "mean_norm/layer18": 10.19717562198639, + "mean_norm/layer19": 10.229287981987, + "mean_norm/layer2": 8.692719519138336, + "mean_norm/layer20": 10.336449027061462, + "mean_norm/layer21": 10.290430724620819, + "mean_norm/layer22": 11.086778223514557, + "mean_norm/layer23": 11.035368502140045, + "mean_norm/layer3": 10.53110146522522, + "mean_norm/layer4": 9.628753662109375, + "mean_norm/layer5": 11.49661272764206, + "mean_norm/layer6": 9.247560143470764, + "mean_norm/layer7": 9.664614796638489, + "mean_norm/layer8": 10.053438544273376, + "mean_norm/layer9": 9.99890947341919, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 7200 + }, + { + "epoch": 3.01, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46351346418271866, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7328038215637207, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.9734, + "eval_samples_per_second": 20.128, + "eval_steps_per_second": 0.668, + "step": 7200 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.03, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4824, + "max_norm": 27.938352584838867, + "max_norm/layer0": 21.70029640197754, + "max_norm/layer1": 23.16924476623535, + "max_norm/layer10": 24.499082565307617, + "max_norm/layer11": 23.14937400817871, + "max_norm/layer12": 24.984052658081055, + "max_norm/layer13": 21.552579879760742, + "max_norm/layer14": 23.241153717041016, + "max_norm/layer15": 27.157886505126953, + "max_norm/layer16": 23.04047393798828, + "max_norm/layer17": 26.968616485595703, + "max_norm/layer18": 23.939163208007812, + "max_norm/layer19": 23.467212677001953, + "max_norm/layer2": 18.67315673828125, + "max_norm/layer20": 24.7244873046875, + "max_norm/layer21": 24.00645637512207, + "max_norm/layer22": 24.86109161376953, + "max_norm/layer23": 24.05797004699707, + "max_norm/layer3": 22.41858673095703, + "max_norm/layer4": 22.14661979675293, + "max_norm/layer5": 27.938352584838867, + "max_norm/layer6": 19.537410736083984, + "max_norm/layer7": 23.92576026916504, + "max_norm/layer8": 24.154558181762695, + "max_norm/layer9": 23.64275550842285, + "mean_norm": 10.212615164617697, + "mean_norm/layer0": 9.738060355186462, + "mean_norm/layer1": 9.737515270709991, + "mean_norm/layer10": 10.090328097343445, + "mean_norm/layer11": 10.338834047317505, + "mean_norm/layer12": 10.741642594337463, + "mean_norm/layer13": 10.060389280319214, + "mean_norm/layer14": 10.394351184368134, + "mean_norm/layer15": 10.646148383617401, + "mean_norm/layer16": 10.14692997932434, + "mean_norm/layer17": 10.571349322795868, + "mean_norm/layer18": 10.207534611225128, + "mean_norm/layer19": 10.240472435951233, + "mean_norm/layer2": 8.696077167987823, + "mean_norm/layer20": 10.347783148288727, + "mean_norm/layer21": 10.30154174566269, + "mean_norm/layer22": 11.101174712181091, + "mean_norm/layer23": 11.049887597560883, + "mean_norm/layer3": 10.543985962867737, + "mean_norm/layer4": 9.636641085147858, + "mean_norm/layer5": 11.513911306858063, + "mean_norm/layer6": 9.253595232963562, + "mean_norm/layer7": 9.67268419265747, + "mean_norm/layer8": 10.063383936882019, + "mean_norm/layer9": 10.00854229927063, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 7250 + }, + { + "epoch": 3.03, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46372032464924984, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.735767364501953, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8416, + "eval_samples_per_second": 20.352, + "eval_steps_per_second": 0.676, + "step": 7250 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.05, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4742, + "max_norm": 28.060808181762695, + "max_norm/layer0": 21.76616668701172, + "max_norm/layer1": 23.24862289428711, + "max_norm/layer10": 24.570327758789062, + "max_norm/layer11": 23.24647331237793, + "max_norm/layer12": 25.09784698486328, + "max_norm/layer13": 21.668365478515625, + "max_norm/layer14": 23.325544357299805, + "max_norm/layer15": 27.291521072387695, + "max_norm/layer16": 23.135894775390625, + "max_norm/layer17": 27.086589813232422, + "max_norm/layer18": 24.027212142944336, + "max_norm/layer19": 23.55608558654785, + "max_norm/layer2": 18.72525978088379, + "max_norm/layer20": 24.830610275268555, + "max_norm/layer21": 24.100738525390625, + "max_norm/layer22": 24.97201156616211, + "max_norm/layer23": 24.144886016845703, + "max_norm/layer3": 22.505525588989258, + "max_norm/layer4": 22.22715950012207, + "max_norm/layer5": 28.060808181762695, + "max_norm/layer6": 19.58978843688965, + "max_norm/layer7": 24.01059913635254, + "max_norm/layer8": 24.2260799407959, + "max_norm/layer9": 23.773536682128906, + "mean_norm": 10.223552122712135, + "mean_norm/layer0": 9.749425172805786, + "mean_norm/layer1": 9.747048020362854, + "mean_norm/layer10": 10.100198149681091, + "mean_norm/layer11": 10.350200355052948, + "mean_norm/layer12": 10.755703628063202, + "mean_norm/layer13": 10.07078105211258, + "mean_norm/layer14": 10.406133830547333, + "mean_norm/layer15": 10.659375131130219, + "mean_norm/layer16": 10.157630205154419, + "mean_norm/layer17": 10.583497643470764, + "mean_norm/layer18": 10.21798974275589, + "mean_norm/layer19": 10.251213431358337, + "mean_norm/layer2": 8.699485063552856, + "mean_norm/layer20": 10.359046816825867, + "mean_norm/layer21": 10.312615513801575, + "mean_norm/layer22": 11.115482449531555, + "mean_norm/layer23": 11.064455330371857, + "mean_norm/layer3": 10.557074010372162, + "mean_norm/layer4": 9.644611239433289, + "mean_norm/layer5": 11.531232297420502, + "mean_norm/layer6": 9.25971406698227, + "mean_norm/layer7": 9.680716574192047, + "mean_norm/layer8": 10.073291182518005, + "mean_norm/layer9": 10.018330037593842, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 7300 + }, + { + "epoch": 3.05, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4618301878374158, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7427256107330322, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8228, + "eval_samples_per_second": 20.384, + "eval_steps_per_second": 0.677, + "step": 7300 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.07, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4903, + "max_norm": 28.1783390045166, + "max_norm/layer0": 21.83902931213379, + "max_norm/layer1": 23.328245162963867, + "max_norm/layer10": 24.659210205078125, + "max_norm/layer11": 23.3525333404541, + "max_norm/layer12": 25.218076705932617, + "max_norm/layer13": 21.76858139038086, + "max_norm/layer14": 23.42473793029785, + "max_norm/layer15": 27.404930114746094, + "max_norm/layer16": 23.211116790771484, + "max_norm/layer17": 27.211097717285156, + "max_norm/layer18": 24.133827209472656, + "max_norm/layer19": 23.656211853027344, + "max_norm/layer2": 18.778493881225586, + "max_norm/layer20": 24.922006607055664, + "max_norm/layer21": 24.207969665527344, + "max_norm/layer22": 25.06915283203125, + "max_norm/layer23": 24.239763259887695, + "max_norm/layer3": 22.60003089904785, + "max_norm/layer4": 22.29958152770996, + "max_norm/layer5": 28.1783390045166, + "max_norm/layer6": 19.645545959472656, + "max_norm/layer7": 24.08893585205078, + "max_norm/layer8": 24.30266761779785, + "max_norm/layer9": 23.877931594848633, + "mean_norm": 10.234688145418962, + "mean_norm/layer0": 9.761431992053986, + "mean_norm/layer1": 9.756781339645386, + "mean_norm/layer10": 10.110297739505768, + "mean_norm/layer11": 10.361783504486084, + "mean_norm/layer12": 10.770005881786346, + "mean_norm/layer13": 10.08151239156723, + "mean_norm/layer14": 10.418040454387665, + "mean_norm/layer15": 10.672817826271057, + "mean_norm/layer16": 10.168405294418335, + "mean_norm/layer17": 10.595774412155151, + "mean_norm/layer18": 10.22852224111557, + "mean_norm/layer19": 10.262270987033844, + "mean_norm/layer2": 8.702980160713196, + "mean_norm/layer20": 10.370457172393799, + "mean_norm/layer21": 10.323876857757568, + "mean_norm/layer22": 11.13010424375534, + "mean_norm/layer23": 11.079138576984406, + "mean_norm/layer3": 10.570332705974579, + "mean_norm/layer4": 9.652642965316772, + "mean_norm/layer5": 11.548939108848572, + "mean_norm/layer6": 9.265985012054443, + "mean_norm/layer7": 9.688855290412903, + "mean_norm/layer8": 10.083318591117859, + "mean_norm/layer9": 10.028240740299225, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 7350 + }, + { + "epoch": 3.07, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4628604340824927, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.739495277404785, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 10.9483, + "eval_samples_per_second": 22.013, + "eval_steps_per_second": 0.731, + "step": 7350 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.09, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5219, + "max_norm": 28.30512046813965, + "max_norm/layer0": 21.925140380859375, + "max_norm/layer1": 23.402666091918945, + "max_norm/layer10": 24.75094223022461, + "max_norm/layer11": 23.466140747070312, + "max_norm/layer12": 25.3124942779541, + "max_norm/layer13": 21.85954475402832, + "max_norm/layer14": 23.502534866333008, + "max_norm/layer15": 27.527902603149414, + "max_norm/layer16": 23.29158592224121, + "max_norm/layer17": 27.323348999023438, + "max_norm/layer18": 24.239091873168945, + "max_norm/layer19": 23.75176239013672, + "max_norm/layer2": 18.829025268554688, + "max_norm/layer20": 25.023799896240234, + "max_norm/layer21": 24.31355094909668, + "max_norm/layer22": 25.157793045043945, + "max_norm/layer23": 24.331005096435547, + "max_norm/layer3": 22.704940795898438, + "max_norm/layer4": 22.374662399291992, + "max_norm/layer5": 28.30512046813965, + "max_norm/layer6": 19.703712463378906, + "max_norm/layer7": 24.16960906982422, + "max_norm/layer8": 24.37641143798828, + "max_norm/layer9": 23.971576690673828, + "mean_norm": 10.245796350141367, + "mean_norm/layer0": 9.773649513721466, + "mean_norm/layer1": 9.76639074087143, + "mean_norm/layer10": 10.12041312456131, + "mean_norm/layer11": 10.373321115970612, + "mean_norm/layer12": 10.784271001815796, + "mean_norm/layer13": 10.09208732843399, + "mean_norm/layer14": 10.429891586303711, + "mean_norm/layer15": 10.686288714408875, + "mean_norm/layer16": 10.17914080619812, + "mean_norm/layer17": 10.608086168766022, + "mean_norm/layer18": 10.238989114761353, + "mean_norm/layer19": 10.273307204246521, + "mean_norm/layer2": 8.706504940986633, + "mean_norm/layer20": 10.381437599658966, + "mean_norm/layer21": 10.334827601909637, + "mean_norm/layer22": 11.144693374633789, + "mean_norm/layer23": 11.09385484457016, + "mean_norm/layer3": 10.583644211292267, + "mean_norm/layer4": 9.66067487001419, + "mean_norm/layer5": 11.566678524017334, + "mean_norm/layer6": 9.272311866283417, + "mean_norm/layer7": 9.697041988372803, + "mean_norm/layer8": 10.093447387218475, + "mean_norm/layer9": 10.038158774375916, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 7400 + }, + { + "epoch": 3.09, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4631037993372353, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7434771060943604, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.9589, + "eval_samples_per_second": 20.152, + "eval_steps_per_second": 0.669, + "step": 7400 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.11, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5297, + "max_norm": 28.41901206970215, + "max_norm/layer0": 21.99617576599121, + "max_norm/layer1": 23.478212356567383, + "max_norm/layer10": 24.831113815307617, + "max_norm/layer11": 23.557214736938477, + "max_norm/layer12": 25.407339096069336, + "max_norm/layer13": 21.933692932128906, + "max_norm/layer14": 23.58243179321289, + "max_norm/layer15": 27.664417266845703, + "max_norm/layer16": 23.40688133239746, + "max_norm/layer17": 27.449398040771484, + "max_norm/layer18": 24.320056915283203, + "max_norm/layer19": 23.8420467376709, + "max_norm/layer2": 18.881885528564453, + "max_norm/layer20": 25.124309539794922, + "max_norm/layer21": 24.40587043762207, + "max_norm/layer22": 25.251537322998047, + "max_norm/layer23": 24.414310455322266, + "max_norm/layer3": 22.804298400878906, + "max_norm/layer4": 22.448192596435547, + "max_norm/layer5": 28.41901206970215, + "max_norm/layer6": 19.762104034423828, + "max_norm/layer7": 24.261402130126953, + "max_norm/layer8": 24.460205078125, + "max_norm/layer9": 24.068944931030273, + "mean_norm": 10.256785544256369, + "mean_norm/layer0": 9.786031067371368, + "mean_norm/layer1": 9.776026725769043, + "mean_norm/layer10": 10.13040566444397, + "mean_norm/layer11": 10.384915590286255, + "mean_norm/layer12": 10.798379123210907, + "mean_norm/layer13": 10.102573335170746, + "mean_norm/layer14": 10.441614508628845, + "mean_norm/layer15": 10.699365377426147, + "mean_norm/layer16": 10.189636588096619, + "mean_norm/layer17": 10.620143711566925, + "mean_norm/layer18": 10.249273598194122, + "mean_norm/layer19": 10.28394889831543, + "mean_norm/layer2": 8.710040807723999, + "mean_norm/layer20": 10.392243266105652, + "mean_norm/layer21": 10.345543622970581, + "mean_norm/layer22": 11.159203112125397, + "mean_norm/layer23": 11.108225405216217, + "mean_norm/layer3": 10.59694367647171, + "mean_norm/layer4": 9.66866660118103, + "mean_norm/layer5": 11.584315299987793, + "mean_norm/layer6": 9.278502762317657, + "mean_norm/layer7": 9.705314993858337, + "mean_norm/layer8": 10.10358864068985, + "mean_norm/layer9": 10.047950685024261, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 7450 + }, + { + "epoch": 3.11, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46243454488669317, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.741889238357544, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 12.0032, + "eval_samples_per_second": 20.078, + "eval_steps_per_second": 0.666, + "step": 7450 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.13, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5378, + "max_norm": 28.534168243408203, + "max_norm/layer0": 22.058876037597656, + "max_norm/layer1": 23.55440330505371, + "max_norm/layer10": 24.924272537231445, + "max_norm/layer11": 23.644363403320312, + "max_norm/layer12": 25.500591278076172, + "max_norm/layer13": 22.042232513427734, + "max_norm/layer14": 23.674577713012695, + "max_norm/layer15": 27.777328491210938, + "max_norm/layer16": 23.501466751098633, + "max_norm/layer17": 27.558422088623047, + "max_norm/layer18": 24.424163818359375, + "max_norm/layer19": 23.938682556152344, + "max_norm/layer2": 18.931631088256836, + "max_norm/layer20": 25.224212646484375, + "max_norm/layer21": 24.5081729888916, + "max_norm/layer22": 25.363332748413086, + "max_norm/layer23": 24.50674819946289, + "max_norm/layer3": 22.900821685791016, + "max_norm/layer4": 22.509111404418945, + "max_norm/layer5": 28.534168243408203, + "max_norm/layer6": 19.816333770751953, + "max_norm/layer7": 24.353036880493164, + "max_norm/layer8": 24.543941497802734, + "max_norm/layer9": 24.16282081604004, + "mean_norm": 10.267906568944454, + "mean_norm/layer0": 9.798717558383942, + "mean_norm/layer1": 9.785801529884338, + "mean_norm/layer10": 10.14056795835495, + "mean_norm/layer11": 10.396467983722687, + "mean_norm/layer12": 10.812629520893097, + "mean_norm/layer13": 10.113163471221924, + "mean_norm/layer14": 10.453515112400055, + "mean_norm/layer15": 10.712714493274689, + "mean_norm/layer16": 10.200285851955414, + "mean_norm/layer17": 10.632267236709595, + "mean_norm/layer18": 10.259525001049042, + "mean_norm/layer19": 10.294664680957794, + "mean_norm/layer2": 8.713631331920624, + "mean_norm/layer20": 10.403029263019562, + "mean_norm/layer21": 10.356555461883545, + "mean_norm/layer22": 11.173887729644775, + "mean_norm/layer23": 11.122698366641998, + "mean_norm/layer3": 10.61043643951416, + "mean_norm/layer4": 9.676729619503021, + "mean_norm/layer5": 11.602260768413544, + "mean_norm/layer6": 9.284881472587585, + "mean_norm/layer7": 9.7137091755867, + "mean_norm/layer8": 10.113835334777832, + "mean_norm/layer9": 10.057782292366028, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 7500 + }, + { + "epoch": 3.13, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4612461112260336, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7466063499450684, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8975, + "eval_samples_per_second": 20.256, + "eval_steps_per_second": 0.672, + "step": 7500 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.15, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5262, + "max_norm": 28.647478103637695, + "max_norm/layer0": 22.12501335144043, + "max_norm/layer1": 23.629316329956055, + "max_norm/layer10": 25.00779151916504, + "max_norm/layer11": 23.737573623657227, + "max_norm/layer12": 25.5867919921875, + "max_norm/layer13": 22.13935661315918, + "max_norm/layer14": 23.769336700439453, + "max_norm/layer15": 27.88351821899414, + "max_norm/layer16": 23.595199584960938, + "max_norm/layer17": 27.670772552490234, + "max_norm/layer18": 24.5206241607666, + "max_norm/layer19": 24.02391815185547, + "max_norm/layer2": 18.966272354125977, + "max_norm/layer20": 25.31734848022461, + "max_norm/layer21": 24.615201950073242, + "max_norm/layer22": 25.462045669555664, + "max_norm/layer23": 24.59248924255371, + "max_norm/layer3": 22.99334716796875, + "max_norm/layer4": 22.572772979736328, + "max_norm/layer5": 28.647478103637695, + "max_norm/layer6": 19.873327255249023, + "max_norm/layer7": 24.456520080566406, + "max_norm/layer8": 24.614551544189453, + "max_norm/layer9": 24.24704933166504, + "mean_norm": 10.278987641135851, + "mean_norm/layer0": 9.811449825763702, + "mean_norm/layer1": 9.795596778392792, + "mean_norm/layer10": 10.150748670101166, + "mean_norm/layer11": 10.407971441745758, + "mean_norm/layer12": 10.826962232589722, + "mean_norm/layer13": 10.123676836490631, + "mean_norm/layer14": 10.465408980846405, + "mean_norm/layer15": 10.726069808006287, + "mean_norm/layer16": 10.210875153541565, + "mean_norm/layer17": 10.644302904605865, + "mean_norm/layer18": 10.269866168498993, + "mean_norm/layer19": 10.305279195308685, + "mean_norm/layer2": 8.717224657535553, + "mean_norm/layer20": 10.413566410541534, + "mean_norm/layer21": 10.367369532585144, + "mean_norm/layer22": 11.18840491771698, + "mean_norm/layer23": 11.13710218667984, + "mean_norm/layer3": 10.623844742774963, + "mean_norm/layer4": 9.68492478132248, + "mean_norm/layer5": 11.620170950889587, + "mean_norm/layer6": 9.291176974773407, + "mean_norm/layer7": 9.722011387348175, + "mean_norm/layer8": 10.12408995628357, + "mean_norm/layer9": 10.067608892917633, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 7550 + }, + { + "epoch": 3.15, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4627468636302795, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.742647886276245, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.9512, + "eval_samples_per_second": 20.165, + "eval_steps_per_second": 0.669, + "step": 7550 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.17, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5466, + "max_norm": 28.759456634521484, + "max_norm/layer0": 22.189687728881836, + "max_norm/layer1": 23.718957901000977, + "max_norm/layer10": 25.11297607421875, + "max_norm/layer11": 23.83050537109375, + "max_norm/layer12": 25.688610076904297, + "max_norm/layer13": 22.221534729003906, + "max_norm/layer14": 23.87668800354004, + "max_norm/layer15": 28.021175384521484, + "max_norm/layer16": 23.694242477416992, + "max_norm/layer17": 27.787132263183594, + "max_norm/layer18": 24.62793731689453, + "max_norm/layer19": 24.113933563232422, + "max_norm/layer2": 19.001083374023438, + "max_norm/layer20": 25.41383171081543, + "max_norm/layer21": 24.711917877197266, + "max_norm/layer22": 25.558143615722656, + "max_norm/layer23": 24.674909591674805, + "max_norm/layer3": 23.080352783203125, + "max_norm/layer4": 22.64613151550293, + "max_norm/layer5": 28.759456634521484, + "max_norm/layer6": 19.9383487701416, + "max_norm/layer7": 24.539579391479492, + "max_norm/layer8": 24.692691802978516, + "max_norm/layer9": 24.328855514526367, + "mean_norm": 10.29014177620411, + "mean_norm/layer0": 9.824274837970734, + "mean_norm/layer1": 9.805485486984253, + "mean_norm/layer10": 10.160942137241364, + "mean_norm/layer11": 10.419573247432709, + "mean_norm/layer12": 10.841314256191254, + "mean_norm/layer13": 10.134314954280853, + "mean_norm/layer14": 10.47724461555481, + "mean_norm/layer15": 10.739534556865692, + "mean_norm/layer16": 10.221598386764526, + "mean_norm/layer17": 10.656368911266327, + "mean_norm/layer18": 10.280156254768372, + "mean_norm/layer19": 10.315918445587158, + "mean_norm/layer2": 8.720892071723938, + "mean_norm/layer20": 10.424446642398834, + "mean_norm/layer21": 10.378287017345428, + "mean_norm/layer22": 11.202922701835632, + "mean_norm/layer23": 11.151463150978088, + "mean_norm/layer3": 10.637423694133759, + "mean_norm/layer4": 9.69320422410965, + "mean_norm/layer5": 11.6382976770401, + "mean_norm/layer6": 9.297437250614166, + "mean_norm/layer7": 9.730381071567535, + "mean_norm/layer8": 10.134437918663025, + "mean_norm/layer9": 10.077483117580414, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 7600 + }, + { + "epoch": 3.17, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4620857213548955, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7406821250915527, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.9297, + "eval_samples_per_second": 20.202, + "eval_steps_per_second": 0.671, + "step": 7600 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.19, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5417, + "max_norm": 28.87610626220703, + "max_norm/layer0": 22.26255989074707, + "max_norm/layer1": 23.79456329345703, + "max_norm/layer10": 25.207901000976562, + "max_norm/layer11": 23.90155601501465, + "max_norm/layer12": 25.78806495666504, + "max_norm/layer13": 22.295835494995117, + "max_norm/layer14": 23.981624603271484, + "max_norm/layer15": 28.134763717651367, + "max_norm/layer16": 23.79250144958496, + "max_norm/layer17": 27.918643951416016, + "max_norm/layer18": 24.73369598388672, + "max_norm/layer19": 24.21535301208496, + "max_norm/layer2": 19.049760818481445, + "max_norm/layer20": 25.499326705932617, + "max_norm/layer21": 24.808273315429688, + "max_norm/layer22": 25.657686233520508, + "max_norm/layer23": 24.76559829711914, + "max_norm/layer3": 23.16707420349121, + "max_norm/layer4": 22.7286376953125, + "max_norm/layer5": 28.87610626220703, + "max_norm/layer6": 19.98716926574707, + "max_norm/layer7": 24.625072479248047, + "max_norm/layer8": 24.779348373413086, + "max_norm/layer9": 24.42043685913086, + "mean_norm": 10.301014435787996, + "mean_norm/layer0": 9.836885809898376, + "mean_norm/layer1": 9.81521886587143, + "mean_norm/layer10": 10.170771658420563, + "mean_norm/layer11": 10.430792689323425, + "mean_norm/layer12": 10.855295896530151, + "mean_norm/layer13": 10.144669532775879, + "mean_norm/layer14": 10.488730907440186, + "mean_norm/layer15": 10.75255537033081, + "mean_norm/layer16": 10.232070505619049, + "mean_norm/layer17": 10.668150544166565, + "mean_norm/layer18": 10.290162086486816, + "mean_norm/layer19": 10.326179146766663, + "mean_norm/layer2": 8.724476277828217, + "mean_norm/layer20": 10.43507844209671, + "mean_norm/layer21": 10.388847172260284, + "mean_norm/layer22": 11.217085540294647, + "mean_norm/layer23": 11.16545057296753, + "mean_norm/layer3": 10.650694847106934, + "mean_norm/layer4": 9.701324820518494, + "mean_norm/layer5": 11.656121969223022, + "mean_norm/layer6": 9.303574085235596, + "mean_norm/layer7": 9.738611280918121, + "mean_norm/layer8": 10.144423842430115, + "mean_norm/layer9": 10.087174594402313, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 7650 + }, + { + "epoch": 3.19, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4635945859342995, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7404425144195557, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 10.9178, + "eval_samples_per_second": 22.074, + "eval_steps_per_second": 0.733, + "step": 7650 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.22, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5543, + "max_norm": 28.989912033081055, + "max_norm/layer0": 22.333951950073242, + "max_norm/layer1": 23.86414909362793, + "max_norm/layer10": 25.30396270751953, + "max_norm/layer11": 23.973237991333008, + "max_norm/layer12": 25.900819778442383, + "max_norm/layer13": 22.36374282836914, + "max_norm/layer14": 24.077177047729492, + "max_norm/layer15": 28.262537002563477, + "max_norm/layer16": 23.878515243530273, + "max_norm/layer17": 28.032825469970703, + "max_norm/layer18": 24.851049423217773, + "max_norm/layer19": 24.301414489746094, + "max_norm/layer2": 19.102933883666992, + "max_norm/layer20": 25.588642120361328, + "max_norm/layer21": 24.90848159790039, + "max_norm/layer22": 25.761886596679688, + "max_norm/layer23": 24.848621368408203, + "max_norm/layer3": 23.259109497070312, + "max_norm/layer4": 22.849287033081055, + "max_norm/layer5": 28.989912033081055, + "max_norm/layer6": 20.03278350830078, + "max_norm/layer7": 24.701374053955078, + "max_norm/layer8": 24.87116050720215, + "max_norm/layer9": 24.52387237548828, + "mean_norm": 10.31198395540317, + "mean_norm/layer0": 9.849559903144836, + "mean_norm/layer1": 9.82489401102066, + "mean_norm/layer10": 10.180826425552368, + "mean_norm/layer11": 10.442092299461365, + "mean_norm/layer12": 10.869353592395782, + "mean_norm/layer13": 10.155152142047882, + "mean_norm/layer14": 10.500398457050323, + "mean_norm/layer15": 10.765804052352905, + "mean_norm/layer16": 10.242531597614288, + "mean_norm/layer17": 10.67978948354721, + "mean_norm/layer18": 10.300297379493713, + "mean_norm/layer19": 10.336560845375061, + "mean_norm/layer2": 8.72812283039093, + "mean_norm/layer20": 10.445524156093597, + "mean_norm/layer21": 10.399671375751495, + "mean_norm/layer22": 11.231338143348694, + "mean_norm/layer23": 11.17959988117218, + "mean_norm/layer3": 10.664167523384094, + "mean_norm/layer4": 9.709515035152435, + "mean_norm/layer5": 11.674124658107758, + "mean_norm/layer6": 9.309807479381561, + "mean_norm/layer7": 9.746842324733734, + "mean_norm/layer8": 10.15455275774002, + "mean_norm/layer9": 10.09708857536316, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 7700 + }, + { + "epoch": 3.22, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4629983410601802, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.741414785385132, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7003, + "eval_samples_per_second": 20.598, + "eval_steps_per_second": 0.684, + "step": 7700 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.24, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5553, + "max_norm": 29.090238571166992, + "max_norm/layer0": 22.41193389892578, + "max_norm/layer1": 23.93515396118164, + "max_norm/layer10": 25.398143768310547, + "max_norm/layer11": 24.047224044799805, + "max_norm/layer12": 25.994855880737305, + "max_norm/layer13": 22.43844985961914, + "max_norm/layer14": 24.178451538085938, + "max_norm/layer15": 28.364883422851562, + "max_norm/layer16": 23.977371215820312, + "max_norm/layer17": 28.133155822753906, + "max_norm/layer18": 24.957571029663086, + "max_norm/layer19": 24.386947631835938, + "max_norm/layer2": 19.165626525878906, + "max_norm/layer20": 25.671714782714844, + "max_norm/layer21": 25.00211524963379, + "max_norm/layer22": 25.86479949951172, + "max_norm/layer23": 24.936710357666016, + "max_norm/layer3": 23.344837188720703, + "max_norm/layer4": 22.948711395263672, + "max_norm/layer5": 29.090238571166992, + "max_norm/layer6": 20.085012435913086, + "max_norm/layer7": 24.796207427978516, + "max_norm/layer8": 24.96137809753418, + "max_norm/layer9": 24.61630630493164, + "mean_norm": 10.322781873246035, + "mean_norm/layer0": 9.862114548683167, + "mean_norm/layer1": 9.834554076194763, + "mean_norm/layer10": 10.19078516960144, + "mean_norm/layer11": 10.453184068202972, + "mean_norm/layer12": 10.883156538009644, + "mean_norm/layer13": 10.16549926996231, + "mean_norm/layer14": 10.511900305747986, + "mean_norm/layer15": 10.778773725032806, + "mean_norm/layer16": 10.252846658229828, + "mean_norm/layer17": 10.691301107406616, + "mean_norm/layer18": 10.310111284255981, + "mean_norm/layer19": 10.346852660179138, + "mean_norm/layer2": 8.731664061546326, + "mean_norm/layer20": 10.455866873264313, + "mean_norm/layer21": 10.410119354724884, + "mean_norm/layer22": 11.245464563369751, + "mean_norm/layer23": 11.193513989448547, + "mean_norm/layer3": 10.677456438541412, + "mean_norm/layer4": 9.71753478050232, + "mean_norm/layer5": 11.691821098327637, + "mean_norm/layer6": 9.316016852855682, + "mean_norm/layer7": 9.754923164844513, + "mean_norm/layer8": 10.164519965648651, + "mean_norm/layer9": 10.106784403324127, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 7750 + }, + { + "epoch": 3.24, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46314436021302574, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7383084297180176, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7215, + "eval_samples_per_second": 20.56, + "eval_steps_per_second": 0.683, + "step": 7750 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.26, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5628, + "max_norm": 29.21254539489746, + "max_norm/layer0": 22.484031677246094, + "max_norm/layer1": 24.008319854736328, + "max_norm/layer10": 25.487390518188477, + "max_norm/layer11": 24.109447479248047, + "max_norm/layer12": 26.10677146911621, + "max_norm/layer13": 22.515703201293945, + "max_norm/layer14": 24.291309356689453, + "max_norm/layer15": 28.477415084838867, + "max_norm/layer16": 24.077625274658203, + "max_norm/layer17": 28.249710083007812, + "max_norm/layer18": 25.04519271850586, + "max_norm/layer19": 24.4896183013916, + "max_norm/layer2": 19.21530532836914, + "max_norm/layer20": 25.777645111083984, + "max_norm/layer21": 25.095863342285156, + "max_norm/layer22": 25.952531814575195, + "max_norm/layer23": 25.035606384277344, + "max_norm/layer3": 23.437124252319336, + "max_norm/layer4": 23.04496192932129, + "max_norm/layer5": 29.21254539489746, + "max_norm/layer6": 20.13669776916504, + "max_norm/layer7": 24.908952713012695, + "max_norm/layer8": 25.054763793945312, + "max_norm/layer9": 24.6956787109375, + "mean_norm": 10.33362782249848, + "mean_norm/layer0": 9.874791443347931, + "mean_norm/layer1": 9.844236731529236, + "mean_norm/layer10": 10.200762331485748, + "mean_norm/layer11": 10.464483559131622, + "mean_norm/layer12": 10.897128105163574, + "mean_norm/layer13": 10.175809919834137, + "mean_norm/layer14": 10.523499190807343, + "mean_norm/layer15": 10.791725218296051, + "mean_norm/layer16": 10.263132691383362, + "mean_norm/layer17": 10.70292180776596, + "mean_norm/layer18": 10.320022165775299, + "mean_norm/layer19": 10.357090592384338, + "mean_norm/layer2": 8.735245108604431, + "mean_norm/layer20": 10.466160774230957, + "mean_norm/layer21": 10.42063820362091, + "mean_norm/layer22": 11.259634852409363, + "mean_norm/layer23": 11.207477986812592, + "mean_norm/layer3": 10.69071638584137, + "mean_norm/layer4": 9.72552090883255, + "mean_norm/layer5": 11.709686279296875, + "mean_norm/layer6": 9.32220333814621, + "mean_norm/layer7": 9.763081669807434, + "mean_norm/layer8": 10.174527645111084, + "mean_norm/layer9": 10.116570830345154, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 7800 + }, + { + "epoch": 3.26, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4632457624025018, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.736220121383667, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.9335, + "eval_samples_per_second": 20.195, + "eval_steps_per_second": 0.67, + "step": 7800 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.28, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5544, + "max_norm": 29.331188201904297, + "max_norm/layer0": 22.55216407775879, + "max_norm/layer1": 24.07997703552246, + "max_norm/layer10": 25.5628719329834, + "max_norm/layer11": 24.17657470703125, + "max_norm/layer12": 26.19219970703125, + "max_norm/layer13": 22.586214065551758, + "max_norm/layer14": 24.382736206054688, + "max_norm/layer15": 28.602956771850586, + "max_norm/layer16": 24.1601619720459, + "max_norm/layer17": 28.35554313659668, + "max_norm/layer18": 25.14252281188965, + "max_norm/layer19": 24.595355987548828, + "max_norm/layer2": 19.27031135559082, + "max_norm/layer20": 25.8691463470459, + "max_norm/layer21": 25.18440055847168, + "max_norm/layer22": 26.064830780029297, + "max_norm/layer23": 25.118104934692383, + "max_norm/layer3": 23.54576301574707, + "max_norm/layer4": 23.14463996887207, + "max_norm/layer5": 29.331188201904297, + "max_norm/layer6": 20.195871353149414, + "max_norm/layer7": 25.005327224731445, + "max_norm/layer8": 25.13247299194336, + "max_norm/layer9": 24.790437698364258, + "mean_norm": 10.344553100566069, + "mean_norm/layer0": 9.88759696483612, + "mean_norm/layer1": 9.854110896587372, + "mean_norm/layer10": 10.210679829120636, + "mean_norm/layer11": 10.475803256034851, + "mean_norm/layer12": 10.911135852336884, + "mean_norm/layer13": 10.186229526996613, + "mean_norm/layer14": 10.535084962844849, + "mean_norm/layer15": 10.804824233055115, + "mean_norm/layer16": 10.273425579071045, + "mean_norm/layer17": 10.714586555957794, + "mean_norm/layer18": 10.32996690273285, + "mean_norm/layer19": 10.367372214794159, + "mean_norm/layer2": 8.738913834095001, + "mean_norm/layer20": 10.476485311985016, + "mean_norm/layer21": 10.431126654148102, + "mean_norm/layer22": 11.273919343948364, + "mean_norm/layer23": 11.221592783927917, + "mean_norm/layer3": 10.70423948764801, + "mean_norm/layer4": 9.73361724615097, + "mean_norm/layer5": 11.727725446224213, + "mean_norm/layer6": 9.328507781028748, + "mean_norm/layer7": 9.771354794502258, + "mean_norm/layer8": 10.184631109237671, + "mean_norm/layer9": 10.126343846321106, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 7850 + }, + { + "epoch": 3.28, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46365542724798514, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.735917329788208, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.9355, + "eval_samples_per_second": 20.192, + "eval_steps_per_second": 0.67, + "step": 7850 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.3, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5519, + "max_norm": 29.44374656677246, + "max_norm/layer0": 22.62066650390625, + "max_norm/layer1": 24.155412673950195, + "max_norm/layer10": 25.649127960205078, + "max_norm/layer11": 24.254257202148438, + "max_norm/layer12": 26.287227630615234, + "max_norm/layer13": 22.658599853515625, + "max_norm/layer14": 24.459514617919922, + "max_norm/layer15": 28.717144012451172, + "max_norm/layer16": 24.274436950683594, + "max_norm/layer17": 28.46417808532715, + "max_norm/layer18": 25.246158599853516, + "max_norm/layer19": 24.703245162963867, + "max_norm/layer2": 19.330106735229492, + "max_norm/layer20": 25.960447311401367, + "max_norm/layer21": 25.28472328186035, + "max_norm/layer22": 26.16750717163086, + "max_norm/layer23": 25.200824737548828, + "max_norm/layer3": 23.6591854095459, + "max_norm/layer4": 23.238862991333008, + "max_norm/layer5": 29.44374656677246, + "max_norm/layer6": 20.259044647216797, + "max_norm/layer7": 25.118812561035156, + "max_norm/layer8": 25.218399047851562, + "max_norm/layer9": 24.899673461914062, + "mean_norm": 10.355501912534237, + "mean_norm/layer0": 9.900353372097015, + "mean_norm/layer1": 9.86406821012497, + "mean_norm/layer10": 10.220719993114471, + "mean_norm/layer11": 10.48711621761322, + "mean_norm/layer12": 10.925248146057129, + "mean_norm/layer13": 10.196601510047913, + "mean_norm/layer14": 10.546653389930725, + "mean_norm/layer15": 10.817915558815002, + "mean_norm/layer16": 10.283754646778107, + "mean_norm/layer17": 10.726405084133148, + "mean_norm/layer18": 10.339860618114471, + "mean_norm/layer19": 10.377592206001282, + "mean_norm/layer2": 8.742589831352234, + "mean_norm/layer20": 10.486961722373962, + "mean_norm/layer21": 10.441667020320892, + "mean_norm/layer22": 11.288079738616943, + "mean_norm/layer23": 11.235736012458801, + "mean_norm/layer3": 10.717736423015594, + "mean_norm/layer4": 9.74189966917038, + "mean_norm/layer5": 11.745728731155396, + "mean_norm/layer6": 9.33476859331131, + "mean_norm/layer7": 9.779621005058289, + "mean_norm/layer8": 10.194773256778717, + "mean_norm/layer9": 10.136194944381714, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 7900 + }, + { + "epoch": 3.3, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46300645323533823, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7365753650665283, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 10.9411, + "eval_samples_per_second": 22.027, + "eval_steps_per_second": 0.731, + "step": 7900 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.32, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5604, + "max_norm": 29.56292724609375, + "max_norm/layer0": 22.706741333007812, + "max_norm/layer1": 24.238323211669922, + "max_norm/layer10": 25.757524490356445, + "max_norm/layer11": 24.320594787597656, + "max_norm/layer12": 26.380447387695312, + "max_norm/layer13": 22.746694564819336, + "max_norm/layer14": 24.556163787841797, + "max_norm/layer15": 28.821693420410156, + "max_norm/layer16": 24.36968994140625, + "max_norm/layer17": 28.576396942138672, + "max_norm/layer18": 25.369043350219727, + "max_norm/layer19": 24.811838150024414, + "max_norm/layer2": 19.388208389282227, + "max_norm/layer20": 26.059162139892578, + "max_norm/layer21": 25.400894165039062, + "max_norm/layer22": 26.286211013793945, + "max_norm/layer23": 25.288856506347656, + "max_norm/layer3": 23.755037307739258, + "max_norm/layer4": 23.329593658447266, + "max_norm/layer5": 29.56292724609375, + "max_norm/layer6": 20.32733154296875, + "max_norm/layer7": 25.217721939086914, + "max_norm/layer8": 25.305147171020508, + "max_norm/layer9": 24.998611450195312, + "mean_norm": 10.366318744917711, + "mean_norm/layer0": 9.913071632385254, + "mean_norm/layer1": 9.87394368648529, + "mean_norm/layer10": 10.230653047561646, + "mean_norm/layer11": 10.498328745365143, + "mean_norm/layer12": 10.939123094081879, + "mean_norm/layer13": 10.206881523132324, + "mean_norm/layer14": 10.558052361011505, + "mean_norm/layer15": 10.830873608589172, + "mean_norm/layer16": 10.293963611125946, + "mean_norm/layer17": 10.738054513931274, + "mean_norm/layer18": 10.349761128425598, + "mean_norm/layer19": 10.387810349464417, + "mean_norm/layer2": 8.7461838722229, + "mean_norm/layer20": 10.49695074558258, + "mean_norm/layer21": 10.451958894729614, + "mean_norm/layer22": 11.301961421966553, + "mean_norm/layer23": 11.249614596366882, + "mean_norm/layer3": 10.73119992017746, + "mean_norm/layer4": 9.750132262706757, + "mean_norm/layer5": 11.763619303703308, + "mean_norm/layer6": 9.34090131521225, + "mean_norm/layer7": 9.787860095500946, + "mean_norm/layer8": 10.204774379730225, + "mean_norm/layer9": 10.145975768566132, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 7950 + }, + { + "epoch": 3.32, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4639434094660972, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7317562103271484, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7183, + "eval_samples_per_second": 20.566, + "eval_steps_per_second": 0.683, + "step": 7950 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.34, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.574, + "max_norm": 29.686235427856445, + "max_norm/layer0": 22.817535400390625, + "max_norm/layer1": 24.31894302368164, + "max_norm/layer10": 25.852500915527344, + "max_norm/layer11": 24.389923095703125, + "max_norm/layer12": 26.46706199645996, + "max_norm/layer13": 22.830928802490234, + "max_norm/layer14": 24.660869598388672, + "max_norm/layer15": 28.929563522338867, + "max_norm/layer16": 24.46345329284668, + "max_norm/layer17": 28.688806533813477, + "max_norm/layer18": 25.51277732849121, + "max_norm/layer19": 24.911882400512695, + "max_norm/layer2": 19.448562622070312, + "max_norm/layer20": 26.146984100341797, + "max_norm/layer21": 25.494787216186523, + "max_norm/layer22": 26.37640953063965, + "max_norm/layer23": 25.375213623046875, + "max_norm/layer3": 23.8410701751709, + "max_norm/layer4": 23.417619705200195, + "max_norm/layer5": 29.686235427856445, + "max_norm/layer6": 20.39133071899414, + "max_norm/layer7": 25.319486618041992, + "max_norm/layer8": 25.389860153198242, + "max_norm/layer9": 25.100292205810547, + "mean_norm": 10.377166591584682, + "mean_norm/layer0": 9.92577999830246, + "mean_norm/layer1": 9.883734285831451, + "mean_norm/layer10": 10.240622818470001, + "mean_norm/layer11": 10.509494483470917, + "mean_norm/layer12": 10.953135788440704, + "mean_norm/layer13": 10.217233061790466, + "mean_norm/layer14": 10.569559216499329, + "mean_norm/layer15": 10.843758702278137, + "mean_norm/layer16": 10.30425751209259, + "mean_norm/layer17": 10.749723374843597, + "mean_norm/layer18": 10.359737277030945, + "mean_norm/layer19": 10.398090779781342, + "mean_norm/layer2": 8.749907433986664, + "mean_norm/layer20": 10.507069289684296, + "mean_norm/layer21": 10.462173759937286, + "mean_norm/layer22": 11.315882444381714, + "mean_norm/layer23": 11.263618886470795, + "mean_norm/layer3": 10.744675993919373, + "mean_norm/layer4": 9.758215069770813, + "mean_norm/layer5": 11.781563222408295, + "mean_norm/layer6": 9.347027242183685, + "mean_norm/layer7": 9.796038210391998, + "mean_norm/layer8": 10.214890122413635, + "mean_norm/layer9": 10.155809223651886, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 8000 + }, + { + "epoch": 3.34, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46419488689599786, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7337546348571777, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 10.9253, + "eval_samples_per_second": 22.059, + "eval_steps_per_second": 0.732, + "step": 8000 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.36, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5681, + "max_norm": 29.79633331298828, + "max_norm/layer0": 22.923782348632812, + "max_norm/layer1": 24.38690185546875, + "max_norm/layer10": 25.94072151184082, + "max_norm/layer11": 24.459306716918945, + "max_norm/layer12": 26.563783645629883, + "max_norm/layer13": 22.916555404663086, + "max_norm/layer14": 24.759183883666992, + "max_norm/layer15": 29.03226089477539, + "max_norm/layer16": 24.558034896850586, + "max_norm/layer17": 28.802165985107422, + "max_norm/layer18": 25.61612892150879, + "max_norm/layer19": 25.000877380371094, + "max_norm/layer2": 19.50658416748047, + "max_norm/layer20": 26.22553253173828, + "max_norm/layer21": 25.60858726501465, + "max_norm/layer22": 26.475278854370117, + "max_norm/layer23": 25.460458755493164, + "max_norm/layer3": 23.920320510864258, + "max_norm/layer4": 23.51832389831543, + "max_norm/layer5": 29.79633331298828, + "max_norm/layer6": 20.452802658081055, + "max_norm/layer7": 25.421403884887695, + "max_norm/layer8": 25.46021270751953, + "max_norm/layer9": 25.197437286376953, + "mean_norm": 10.387797482311726, + "mean_norm/layer0": 9.938105344772339, + "mean_norm/layer1": 9.893487989902496, + "mean_norm/layer10": 10.250402808189392, + "mean_norm/layer11": 10.520434379577637, + "mean_norm/layer12": 10.96678900718689, + "mean_norm/layer13": 10.227465033531189, + "mean_norm/layer14": 10.580823600292206, + "mean_norm/layer15": 10.856427371501923, + "mean_norm/layer16": 10.314347922801971, + "mean_norm/layer17": 10.761028468608856, + "mean_norm/layer18": 10.369467556476593, + "mean_norm/layer19": 10.408168733119965, + "mean_norm/layer2": 8.753524899482727, + "mean_norm/layer20": 10.516979813575745, + "mean_norm/layer21": 10.47218245267868, + "mean_norm/layer22": 11.329629778862, + "mean_norm/layer23": 11.277422606945038, + "mean_norm/layer3": 10.75775521993637, + "mean_norm/layer4": 9.766146004199982, + "mean_norm/layer5": 11.799201905727386, + "mean_norm/layer6": 9.35314804315567, + "mean_norm/layer7": 9.804097712039948, + "mean_norm/layer8": 10.22478049993515, + "mean_norm/layer9": 10.165322422981262, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 8050 + }, + { + "epoch": 3.36, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46359864202187856, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7321524620056152, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.9139, + "eval_samples_per_second": 20.228, + "eval_steps_per_second": 0.671, + "step": 8050 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.38, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5672, + "max_norm": 29.917709350585938, + "max_norm/layer0": 23.026636123657227, + "max_norm/layer1": 24.44870376586914, + "max_norm/layer10": 26.026018142700195, + "max_norm/layer11": 24.52729034423828, + "max_norm/layer12": 26.678749084472656, + "max_norm/layer13": 23.003549575805664, + "max_norm/layer14": 24.862823486328125, + "max_norm/layer15": 29.15134048461914, + "max_norm/layer16": 24.638816833496094, + "max_norm/layer17": 28.92781639099121, + "max_norm/layer18": 25.733177185058594, + "max_norm/layer19": 25.097875595092773, + "max_norm/layer2": 19.571752548217773, + "max_norm/layer20": 26.306419372558594, + "max_norm/layer21": 25.732044219970703, + "max_norm/layer22": 26.59418296813965, + "max_norm/layer23": 25.56702995300293, + "max_norm/layer3": 23.995433807373047, + "max_norm/layer4": 23.631168365478516, + "max_norm/layer5": 29.917709350585938, + "max_norm/layer6": 20.507673263549805, + "max_norm/layer7": 25.506603240966797, + "max_norm/layer8": 25.542097091674805, + "max_norm/layer9": 25.293928146362305, + "mean_norm": 10.398542570571104, + "mean_norm/layer0": 9.950576424598694, + "mean_norm/layer1": 9.903380393981934, + "mean_norm/layer10": 10.2602379322052, + "mean_norm/layer11": 10.531521320343018, + "mean_norm/layer12": 10.980621695518494, + "mean_norm/layer13": 10.237708628177643, + "mean_norm/layer14": 10.592123091220856, + "mean_norm/layer15": 10.86921912431717, + "mean_norm/layer16": 10.324528396129608, + "mean_norm/layer17": 10.772493362426758, + "mean_norm/layer18": 10.379202902317047, + "mean_norm/layer19": 10.41831624507904, + "mean_norm/layer2": 8.757138550281525, + "mean_norm/layer20": 10.527169048786163, + "mean_norm/layer21": 10.482528150081635, + "mean_norm/layer22": 11.343506574630737, + "mean_norm/layer23": 11.291179537773132, + "mean_norm/layer3": 10.771021962165833, + "mean_norm/layer4": 9.77420699596405, + "mean_norm/layer5": 11.816980540752411, + "mean_norm/layer6": 9.359247148036957, + "mean_norm/layer7": 9.812303245067596, + "mean_norm/layer8": 10.234733879566193, + "mean_norm/layer9": 10.17507654428482, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 8100 + }, + { + "epoch": 3.38, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46344856678145396, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7265894412994385, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.773, + "eval_samples_per_second": 20.471, + "eval_steps_per_second": 0.68, + "step": 8100 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.4, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5544, + "max_norm": 30.036163330078125, + "max_norm/layer0": 23.137466430664062, + "max_norm/layer1": 24.516328811645508, + "max_norm/layer10": 26.114761352539062, + "max_norm/layer11": 24.583471298217773, + "max_norm/layer12": 26.794891357421875, + "max_norm/layer13": 23.09189224243164, + "max_norm/layer14": 24.96297264099121, + "max_norm/layer15": 29.24390983581543, + "max_norm/layer16": 24.714712142944336, + "max_norm/layer17": 29.043437957763672, + "max_norm/layer18": 25.807891845703125, + "max_norm/layer19": 25.197919845581055, + "max_norm/layer2": 19.644575119018555, + "max_norm/layer20": 26.390174865722656, + "max_norm/layer21": 25.839521408081055, + "max_norm/layer22": 26.697118759155273, + "max_norm/layer23": 25.650402069091797, + "max_norm/layer3": 24.080507278442383, + "max_norm/layer4": 23.73740577697754, + "max_norm/layer5": 30.036163330078125, + "max_norm/layer6": 20.57171058654785, + "max_norm/layer7": 25.5966739654541, + "max_norm/layer8": 25.62618637084961, + "max_norm/layer9": 25.398679733276367, + "mean_norm": 10.409372217953205, + "mean_norm/layer0": 9.963123381137848, + "mean_norm/layer1": 9.913290679454803, + "mean_norm/layer10": 10.270268023014069, + "mean_norm/layer11": 10.542797803878784, + "mean_norm/layer12": 10.994561910629272, + "mean_norm/layer13": 10.248073875904083, + "mean_norm/layer14": 10.603521823883057, + "mean_norm/layer15": 10.882000625133514, + "mean_norm/layer16": 10.334827065467834, + "mean_norm/layer17": 10.784078478813171, + "mean_norm/layer18": 10.389080286026001, + "mean_norm/layer19": 10.428483843803406, + "mean_norm/layer2": 8.760785043239594, + "mean_norm/layer20": 10.537615478038788, + "mean_norm/layer21": 10.492811977863312, + "mean_norm/layer22": 11.357585430145264, + "mean_norm/layer23": 11.305007696151733, + "mean_norm/layer3": 10.784351646900177, + "mean_norm/layer4": 9.78234201669693, + "mean_norm/layer5": 11.834979832172394, + "mean_norm/layer6": 9.365468978881836, + "mean_norm/layer7": 9.820427119731903, + "mean_norm/layer8": 10.244697272777557, + "mean_norm/layer9": 10.184752941131592, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 8150 + }, + { + "epoch": 3.4, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4645639908656908, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7237918376922607, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.9291, + "eval_samples_per_second": 20.203, + "eval_steps_per_second": 0.671, + "step": 8150 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.42, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5709, + "max_norm": 30.166780471801758, + "max_norm/layer0": 23.243453979492188, + "max_norm/layer1": 24.587581634521484, + "max_norm/layer10": 26.202739715576172, + "max_norm/layer11": 24.643613815307617, + "max_norm/layer12": 26.904972076416016, + "max_norm/layer13": 23.170438766479492, + "max_norm/layer14": 25.052398681640625, + "max_norm/layer15": 29.362018585205078, + "max_norm/layer16": 24.78993034362793, + "max_norm/layer17": 29.15652847290039, + "max_norm/layer18": 25.90541648864746, + "max_norm/layer19": 25.296329498291016, + "max_norm/layer2": 19.711423873901367, + "max_norm/layer20": 26.483051300048828, + "max_norm/layer21": 25.928726196289062, + "max_norm/layer22": 26.79326629638672, + "max_norm/layer23": 25.732973098754883, + "max_norm/layer3": 24.16873550415039, + "max_norm/layer4": 23.828855514526367, + "max_norm/layer5": 30.166780471801758, + "max_norm/layer6": 20.63398551940918, + "max_norm/layer7": 25.68387794494629, + "max_norm/layer8": 25.716650009155273, + "max_norm/layer9": 25.49351692199707, + "mean_norm": 10.420199210445086, + "mean_norm/layer0": 9.975629687309265, + "mean_norm/layer1": 9.923239886760712, + "mean_norm/layer10": 10.280281364917755, + "mean_norm/layer11": 10.553914904594421, + "mean_norm/layer12": 11.008561134338379, + "mean_norm/layer13": 10.25827956199646, + "mean_norm/layer14": 10.61497974395752, + "mean_norm/layer15": 10.894914627075195, + "mean_norm/layer16": 10.345185399055481, + "mean_norm/layer17": 10.795701205730438, + "mean_norm/layer18": 10.398858368396759, + "mean_norm/layer19": 10.43862897157669, + "mean_norm/layer2": 8.76432204246521, + "mean_norm/layer20": 10.54761826992035, + "mean_norm/layer21": 10.503165245056152, + "mean_norm/layer22": 11.37176662683487, + "mean_norm/layer23": 11.318861424922943, + "mean_norm/layer3": 10.797767579555511, + "mean_norm/layer4": 9.79049038887024, + "mean_norm/layer5": 11.852981925010681, + "mean_norm/layer6": 9.371674835681915, + "mean_norm/layer7": 9.828672230243683, + "mean_norm/layer8": 10.254789173603058, + "mean_norm/layer9": 10.19449645280838, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 8200 + }, + { + "epoch": 3.42, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46372032464924984, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7265851497650146, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.9418, + "eval_samples_per_second": 20.181, + "eval_steps_per_second": 0.67, + "step": 8200 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.44, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5516, + "max_norm": 30.276281356811523, + "max_norm/layer0": 23.351200103759766, + "max_norm/layer1": 24.666385650634766, + "max_norm/layer10": 26.298505783081055, + "max_norm/layer11": 24.71743392944336, + "max_norm/layer12": 27.001976013183594, + "max_norm/layer13": 23.236825942993164, + "max_norm/layer14": 25.13396644592285, + "max_norm/layer15": 29.4676513671875, + "max_norm/layer16": 24.866540908813477, + "max_norm/layer17": 29.276226043701172, + "max_norm/layer18": 26.03716278076172, + "max_norm/layer19": 25.378047943115234, + "max_norm/layer2": 19.76215934753418, + "max_norm/layer20": 26.57210922241211, + "max_norm/layer21": 26.011999130249023, + "max_norm/layer22": 26.882152557373047, + "max_norm/layer23": 25.821067810058594, + "max_norm/layer3": 24.24490737915039, + "max_norm/layer4": 23.920644760131836, + "max_norm/layer5": 30.276281356811523, + "max_norm/layer6": 20.692121505737305, + "max_norm/layer7": 25.77505874633789, + "max_norm/layer8": 25.806955337524414, + "max_norm/layer9": 25.58926773071289, + "mean_norm": 10.430931073923906, + "mean_norm/layer0": 9.98804497718811, + "mean_norm/layer1": 9.933098196983337, + "mean_norm/layer10": 10.290146708488464, + "mean_norm/layer11": 10.565122425556183, + "mean_norm/layer12": 11.022390842437744, + "mean_norm/layer13": 10.268523097038269, + "mean_norm/layer14": 10.62632930278778, + "mean_norm/layer15": 10.907580077648163, + "mean_norm/layer16": 10.35539186000824, + "mean_norm/layer17": 10.807102382183075, + "mean_norm/layer18": 10.408660113811493, + "mean_norm/layer19": 10.448697566986084, + "mean_norm/layer2": 8.767856657505035, + "mean_norm/layer20": 10.557779371738434, + "mean_norm/layer21": 10.513407111167908, + "mean_norm/layer22": 11.38557916879654, + "mean_norm/layer23": 11.332580626010895, + "mean_norm/layer3": 10.811109960079193, + "mean_norm/layer4": 9.798513650894165, + "mean_norm/layer5": 11.87085086107254, + "mean_norm/layer6": 9.377831220626831, + "mean_norm/layer7": 9.836784183979034, + "mean_norm/layer8": 10.264754116535187, + "mean_norm/layer9": 10.204211294651031, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 8250 + }, + { + "epoch": 3.44, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46428006473515776, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7251768112182617, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7806, + "eval_samples_per_second": 20.457, + "eval_steps_per_second": 0.679, + "step": 8250 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.47, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5684, + "max_norm": 30.39374351501465, + "max_norm/layer0": 23.451919555664062, + "max_norm/layer1": 24.738218307495117, + "max_norm/layer10": 26.394065856933594, + "max_norm/layer11": 24.77541732788086, + "max_norm/layer12": 27.105628967285156, + "max_norm/layer13": 23.32464027404785, + "max_norm/layer14": 25.2191162109375, + "max_norm/layer15": 29.590665817260742, + "max_norm/layer16": 24.959054946899414, + "max_norm/layer17": 29.399641036987305, + "max_norm/layer18": 26.127994537353516, + "max_norm/layer19": 25.49078941345215, + "max_norm/layer2": 19.80423927307129, + "max_norm/layer20": 26.659399032592773, + "max_norm/layer21": 26.106576919555664, + "max_norm/layer22": 26.97296905517578, + "max_norm/layer23": 25.90880584716797, + "max_norm/layer3": 24.324474334716797, + "max_norm/layer4": 24.0111083984375, + "max_norm/layer5": 30.39374351501465, + "max_norm/layer6": 20.750532150268555, + "max_norm/layer7": 25.87520980834961, + "max_norm/layer8": 25.891870498657227, + "max_norm/layer9": 25.693950653076172, + "mean_norm": 10.441620844105879, + "mean_norm/layer0": 10.000455558300018, + "mean_norm/layer1": 9.942868113517761, + "mean_norm/layer10": 10.300001859664917, + "mean_norm/layer11": 10.5762220621109, + "mean_norm/layer12": 11.036210000514984, + "mean_norm/layer13": 10.27873706817627, + "mean_norm/layer14": 10.63762879371643, + "mean_norm/layer15": 10.920246362686157, + "mean_norm/layer16": 10.365561723709106, + "mean_norm/layer17": 10.818557620048523, + "mean_norm/layer18": 10.418470799922943, + "mean_norm/layer19": 10.458708882331848, + "mean_norm/layer2": 8.771406590938568, + "mean_norm/layer20": 10.567735850811005, + "mean_norm/layer21": 10.523515522480011, + "mean_norm/layer22": 11.399278342723846, + "mean_norm/layer23": 11.346218764781952, + "mean_norm/layer3": 10.824534296989441, + "mean_norm/layer4": 9.806449353694916, + "mean_norm/layer5": 11.888680815696716, + "mean_norm/layer6": 9.383990585803986, + "mean_norm/layer7": 9.844885289669037, + "mean_norm/layer8": 10.274694323539734, + "mean_norm/layer9": 10.213841676712036, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 8300 + }, + { + "epoch": 3.47, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46520079661560054, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7237327098846436, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.9328, + "eval_samples_per_second": 20.196, + "eval_steps_per_second": 0.67, + "step": 8300 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.49, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5825, + "max_norm": 30.522048950195312, + "max_norm/layer0": 23.55970573425293, + "max_norm/layer1": 24.81685447692871, + "max_norm/layer10": 26.48958396911621, + "max_norm/layer11": 24.84947395324707, + "max_norm/layer12": 27.182397842407227, + "max_norm/layer13": 23.40679168701172, + "max_norm/layer14": 25.298507690429688, + "max_norm/layer15": 29.69232749938965, + "max_norm/layer16": 25.0523624420166, + "max_norm/layer17": 29.538833618164062, + "max_norm/layer18": 26.200260162353516, + "max_norm/layer19": 25.59515380859375, + "max_norm/layer2": 19.851430892944336, + "max_norm/layer20": 26.742952346801758, + "max_norm/layer21": 26.21401596069336, + "max_norm/layer22": 27.071521759033203, + "max_norm/layer23": 25.991113662719727, + "max_norm/layer3": 24.40773582458496, + "max_norm/layer4": 24.08420753479004, + "max_norm/layer5": 30.522048950195312, + "max_norm/layer6": 20.804243087768555, + "max_norm/layer7": 25.957096099853516, + "max_norm/layer8": 25.9805965423584, + "max_norm/layer9": 25.79876708984375, + "mean_norm": 10.452224182585875, + "mean_norm/layer0": 10.012845158576965, + "mean_norm/layer1": 9.95258343219757, + "mean_norm/layer10": 10.309782326221466, + "mean_norm/layer11": 10.58720487356186, + "mean_norm/layer12": 11.049781918525696, + "mean_norm/layer13": 10.288818776607513, + "mean_norm/layer14": 10.648904502391815, + "mean_norm/layer15": 10.932937741279602, + "mean_norm/layer16": 10.375604629516602, + "mean_norm/layer17": 10.829921543598175, + "mean_norm/layer18": 10.428043961524963, + "mean_norm/layer19": 10.468553483486176, + "mean_norm/layer2": 8.774953544139862, + "mean_norm/layer20": 10.577674269676208, + "mean_norm/layer21": 10.533466219902039, + "mean_norm/layer22": 11.413104712963104, + "mean_norm/layer23": 11.359838545322418, + "mean_norm/layer3": 10.837815344333649, + "mean_norm/layer4": 9.814239382743835, + "mean_norm/layer5": 11.906380355358124, + "mean_norm/layer6": 9.39007294178009, + "mean_norm/layer7": 9.852976441383362, + "mean_norm/layer8": 10.284550070762634, + "mean_norm/layer9": 10.223326206207275, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 8350 + }, + { + "epoch": 3.49, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4650101604993855, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7208874225616455, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 10.9067, + "eval_samples_per_second": 22.096, + "eval_steps_per_second": 0.733, + "step": 8350 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.51, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5674, + "max_norm": 30.639392852783203, + "max_norm/layer0": 23.658632278442383, + "max_norm/layer1": 24.890296936035156, + "max_norm/layer10": 26.574634552001953, + "max_norm/layer11": 24.93674659729004, + "max_norm/layer12": 27.2740478515625, + "max_norm/layer13": 23.50137710571289, + "max_norm/layer14": 25.371257781982422, + "max_norm/layer15": 29.808671951293945, + "max_norm/layer16": 25.12998390197754, + "max_norm/layer17": 29.665565490722656, + "max_norm/layer18": 26.2768497467041, + "max_norm/layer19": 25.701955795288086, + "max_norm/layer2": 19.902111053466797, + "max_norm/layer20": 26.831134796142578, + "max_norm/layer21": 26.28788948059082, + "max_norm/layer22": 27.162761688232422, + "max_norm/layer23": 26.07558250427246, + "max_norm/layer3": 24.493680953979492, + "max_norm/layer4": 24.156644821166992, + "max_norm/layer5": 30.639392852783203, + "max_norm/layer6": 20.861595153808594, + "max_norm/layer7": 26.031085968017578, + "max_norm/layer8": 26.07181167602539, + "max_norm/layer9": 25.8958740234375, + "mean_norm": 10.462683290243149, + "mean_norm/layer0": 10.02505087852478, + "mean_norm/layer1": 9.962117493152618, + "mean_norm/layer10": 10.319499015808105, + "mean_norm/layer11": 10.598048448562622, + "mean_norm/layer12": 11.06323504447937, + "mean_norm/layer13": 10.298875629901886, + "mean_norm/layer14": 10.660021245479584, + "mean_norm/layer15": 10.945443570613861, + "mean_norm/layer16": 10.38556182384491, + "mean_norm/layer17": 10.84118789434433, + "mean_norm/layer18": 10.43755179643631, + "mean_norm/layer19": 10.47838807106018, + "mean_norm/layer2": 8.778468549251556, + "mean_norm/layer20": 10.587294101715088, + "mean_norm/layer21": 10.54331248998642, + "mean_norm/layer22": 11.42659991979599, + "mean_norm/layer23": 11.373156070709229, + "mean_norm/layer3": 10.850870013237, + "mean_norm/layer4": 9.821917593479156, + "mean_norm/layer5": 11.923875868320465, + "mean_norm/layer6": 9.39600282907486, + "mean_norm/layer7": 9.860944926738739, + "mean_norm/layer8": 10.294282972812653, + "mean_norm/layer9": 10.23269271850586, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 8400 + }, + { + "epoch": 3.51, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4650669457254921, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.718179702758789, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 10.889, + "eval_samples_per_second": 22.132, + "eval_steps_per_second": 0.735, + "step": 8400 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.53, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5798, + "max_norm": 30.766651153564453, + "max_norm/layer0": 23.751983642578125, + "max_norm/layer1": 24.96283531188965, + "max_norm/layer10": 26.6643009185791, + "max_norm/layer11": 25.018144607543945, + "max_norm/layer12": 27.3858699798584, + "max_norm/layer13": 23.57953453063965, + "max_norm/layer14": 25.471681594848633, + "max_norm/layer15": 29.91374969482422, + "max_norm/layer16": 25.209827423095703, + "max_norm/layer17": 29.779539108276367, + "max_norm/layer18": 26.364397048950195, + "max_norm/layer19": 25.807302474975586, + "max_norm/layer2": 19.943843841552734, + "max_norm/layer20": 26.922224044799805, + "max_norm/layer21": 26.374265670776367, + "max_norm/layer22": 27.24306869506836, + "max_norm/layer23": 26.16399383544922, + "max_norm/layer3": 24.571680068969727, + "max_norm/layer4": 24.2481689453125, + "max_norm/layer5": 30.766651153564453, + "max_norm/layer6": 20.909099578857422, + "max_norm/layer7": 26.11029624938965, + "max_norm/layer8": 26.175079345703125, + "max_norm/layer9": 25.993101119995117, + "mean_norm": 10.473153608540693, + "mean_norm/layer0": 10.037110924720764, + "mean_norm/layer1": 9.971767902374268, + "mean_norm/layer10": 10.329081892967224, + "mean_norm/layer11": 10.608945548534393, + "mean_norm/layer12": 11.076784670352936, + "mean_norm/layer13": 10.308919906616211, + "mean_norm/layer14": 10.671100199222565, + "mean_norm/layer15": 10.958038628101349, + "mean_norm/layer16": 10.395552039146423, + "mean_norm/layer17": 10.852413356304169, + "mean_norm/layer18": 10.447036266326904, + "mean_norm/layer19": 10.488157510757446, + "mean_norm/layer2": 8.781982839107513, + "mean_norm/layer20": 10.596912443637848, + "mean_norm/layer21": 10.553145587444305, + "mean_norm/layer22": 11.439911663532257, + "mean_norm/layer23": 11.386568009853363, + "mean_norm/layer3": 10.86396187543869, + "mean_norm/layer4": 9.82959532737732, + "mean_norm/layer5": 11.941483497619629, + "mean_norm/layer6": 9.401970863342285, + "mean_norm/layer7": 9.869019269943237, + "mean_norm/layer8": 10.30410349369049, + "mean_norm/layer9": 10.242122888565063, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 8450 + }, + { + "epoch": 3.53, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4649087583099094, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7157468795776367, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.9398, + "eval_samples_per_second": 20.185, + "eval_steps_per_second": 0.67, + "step": 8450 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.55, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5788, + "max_norm": 30.9117374420166, + "max_norm/layer0": 23.839109420776367, + "max_norm/layer1": 25.04669761657715, + "max_norm/layer10": 26.760334014892578, + "max_norm/layer11": 25.07632827758789, + "max_norm/layer12": 27.48368263244629, + "max_norm/layer13": 23.673465728759766, + "max_norm/layer14": 25.5750675201416, + "max_norm/layer15": 30.018980026245117, + "max_norm/layer16": 25.29213523864746, + "max_norm/layer17": 29.91062355041504, + "max_norm/layer18": 26.471200942993164, + "max_norm/layer19": 25.893930435180664, + "max_norm/layer2": 20.0001220703125, + "max_norm/layer20": 27.020864486694336, + "max_norm/layer21": 26.478113174438477, + "max_norm/layer22": 27.32907485961914, + "max_norm/layer23": 26.25127410888672, + "max_norm/layer3": 24.64104652404785, + "max_norm/layer4": 24.34300994873047, + "max_norm/layer5": 30.9117374420166, + "max_norm/layer6": 20.962677001953125, + "max_norm/layer7": 26.191547393798828, + "max_norm/layer8": 26.274858474731445, + "max_norm/layer9": 26.109769821166992, + "mean_norm": 10.483579012254873, + "mean_norm/layer0": 10.04910922050476, + "mean_norm/layer1": 9.981406450271606, + "mean_norm/layer10": 10.33859497308731, + "mean_norm/layer11": 10.619703590869904, + "mean_norm/layer12": 11.090156137943268, + "mean_norm/layer13": 10.31883031129837, + "mean_norm/layer14": 10.682014226913452, + "mean_norm/layer15": 10.970479130744934, + "mean_norm/layer16": 10.405543386936188, + "mean_norm/layer17": 10.863610625267029, + "mean_norm/layer18": 10.4564608335495, + "mean_norm/layer19": 10.497778236865997, + "mean_norm/layer2": 8.785513758659363, + "mean_norm/layer20": 10.606768667697906, + "mean_norm/layer21": 10.5628901720047, + "mean_norm/layer22": 11.453165590763092, + "mean_norm/layer23": 11.399942815303802, + "mean_norm/layer3": 10.876989305019379, + "mean_norm/layer4": 9.837391912937164, + "mean_norm/layer5": 11.959004819393158, + "mean_norm/layer6": 9.407935559749603, + "mean_norm/layer7": 9.877058207988739, + "mean_norm/layer8": 10.313934981822968, + "mean_norm/layer9": 10.25161337852478, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 8500 + }, + { + "epoch": 3.55, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46567130277476954, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.716278314590454, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.9286, + "eval_samples_per_second": 20.203, + "eval_steps_per_second": 0.671, + "step": 8500 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.57, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.574, + "max_norm": 31.035043716430664, + "max_norm/layer0": 23.93219757080078, + "max_norm/layer1": 25.118915557861328, + "max_norm/layer10": 26.85211181640625, + "max_norm/layer11": 25.140438079833984, + "max_norm/layer12": 27.57324981689453, + "max_norm/layer13": 23.7674503326416, + "max_norm/layer14": 25.660987854003906, + "max_norm/layer15": 30.117841720581055, + "max_norm/layer16": 25.384872436523438, + "max_norm/layer17": 30.02664566040039, + "max_norm/layer18": 26.555728912353516, + "max_norm/layer19": 25.99490737915039, + "max_norm/layer2": 20.0588436126709, + "max_norm/layer20": 27.112516403198242, + "max_norm/layer21": 26.563764572143555, + "max_norm/layer22": 27.413936614990234, + "max_norm/layer23": 26.341724395751953, + "max_norm/layer3": 24.70960235595703, + "max_norm/layer4": 24.425901412963867, + "max_norm/layer5": 31.035043716430664, + "max_norm/layer6": 21.027484893798828, + "max_norm/layer7": 26.281536102294922, + "max_norm/layer8": 26.368459701538086, + "max_norm/layer9": 26.20467185974121, + "mean_norm": 10.494121707975864, + "mean_norm/layer0": 10.061342477798462, + "mean_norm/layer1": 9.99113255739212, + "mean_norm/layer10": 10.348263144493103, + "mean_norm/layer11": 10.630640387535095, + "mean_norm/layer12": 11.10374128818512, + "mean_norm/layer13": 10.32883608341217, + "mean_norm/layer14": 10.693177998065948, + "mean_norm/layer15": 10.983099639415741, + "mean_norm/layer16": 10.415638208389282, + "mean_norm/layer17": 10.874902606010437, + "mean_norm/layer18": 10.465932965278625, + "mean_norm/layer19": 10.507543802261353, + "mean_norm/layer2": 8.789079010486603, + "mean_norm/layer20": 10.616671085357666, + "mean_norm/layer21": 10.572692036628723, + "mean_norm/layer22": 11.466717422008514, + "mean_norm/layer23": 11.413405001163483, + "mean_norm/layer3": 10.890101253986359, + "mean_norm/layer4": 9.845227479934692, + "mean_norm/layer5": 11.9767746925354, + "mean_norm/layer6": 9.41396027803421, + "mean_norm/layer7": 9.885132670402527, + "mean_norm/layer8": 10.323809742927551, + "mean_norm/layer9": 10.26109915971756, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 8550 + }, + { + "epoch": 3.57, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4657078075629809, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7177693843841553, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7202, + "eval_samples_per_second": 20.563, + "eval_steps_per_second": 0.683, + "step": 8550 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.59, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5612, + "max_norm": 31.140310287475586, + "max_norm/layer0": 24.02177619934082, + "max_norm/layer1": 25.188316345214844, + "max_norm/layer10": 26.956527709960938, + "max_norm/layer11": 25.21898651123047, + "max_norm/layer12": 27.661983489990234, + "max_norm/layer13": 23.849395751953125, + "max_norm/layer14": 25.733461380004883, + "max_norm/layer15": 30.240049362182617, + "max_norm/layer16": 25.489137649536133, + "max_norm/layer17": 30.150360107421875, + "max_norm/layer18": 26.642009735107422, + "max_norm/layer19": 26.0812931060791, + "max_norm/layer2": 20.112157821655273, + "max_norm/layer20": 27.20627212524414, + "max_norm/layer21": 26.658498764038086, + "max_norm/layer22": 27.516849517822266, + "max_norm/layer23": 26.427011489868164, + "max_norm/layer3": 24.779708862304688, + "max_norm/layer4": 24.51090431213379, + "max_norm/layer5": 31.140310287475586, + "max_norm/layer6": 21.10075569152832, + "max_norm/layer7": 26.379568099975586, + "max_norm/layer8": 26.46396827697754, + "max_norm/layer9": 26.29374885559082, + "mean_norm": 10.504519318540892, + "mean_norm/layer0": 10.073370933532715, + "mean_norm/layer1": 10.000800788402557, + "mean_norm/layer10": 10.357769906520844, + "mean_norm/layer11": 10.6414253115654, + "mean_norm/layer12": 11.117177963256836, + "mean_norm/layer13": 10.33878743648529, + "mean_norm/layer14": 10.704220652580261, + "mean_norm/layer15": 10.995559275150299, + "mean_norm/layer16": 10.425552606582642, + "mean_norm/layer17": 10.886011600494385, + "mean_norm/layer18": 10.475245594978333, + "mean_norm/layer19": 10.51713490486145, + "mean_norm/layer2": 8.792496740818024, + "mean_norm/layer20": 10.626440286636353, + "mean_norm/layer21": 10.582411348819733, + "mean_norm/layer22": 11.480081796646118, + "mean_norm/layer23": 11.42665684223175, + "mean_norm/layer3": 10.903161942958832, + "mean_norm/layer4": 9.852953791618347, + "mean_norm/layer5": 11.994223237037659, + "mean_norm/layer6": 9.419936060905457, + "mean_norm/layer7": 9.893079459667206, + "mean_norm/layer8": 10.33350384235382, + "mean_norm/layer9": 10.270461320877075, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 8600 + }, + { + "epoch": 3.59, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46590655585435403, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7106266021728516, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.9154, + "eval_samples_per_second": 20.226, + "eval_steps_per_second": 0.671, + "step": 8600 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.61, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5816, + "max_norm": 31.250791549682617, + "max_norm/layer0": 24.110010147094727, + "max_norm/layer1": 25.280006408691406, + "max_norm/layer10": 27.059661865234375, + "max_norm/layer11": 25.282930374145508, + "max_norm/layer12": 27.764455795288086, + "max_norm/layer13": 23.927961349487305, + "max_norm/layer14": 25.809751510620117, + "max_norm/layer15": 30.362098693847656, + "max_norm/layer16": 25.56882667541504, + "max_norm/layer17": 30.28155517578125, + "max_norm/layer18": 26.721351623535156, + "max_norm/layer19": 26.17807960510254, + "max_norm/layer2": 20.16436004638672, + "max_norm/layer20": 27.294723510742188, + "max_norm/layer21": 26.74715805053711, + "max_norm/layer22": 27.608800888061523, + "max_norm/layer23": 26.51601219177246, + "max_norm/layer3": 24.850908279418945, + "max_norm/layer4": 24.58802604675293, + "max_norm/layer5": 31.250791549682617, + "max_norm/layer6": 21.15802764892578, + "max_norm/layer7": 26.47740364074707, + "max_norm/layer8": 26.554189682006836, + "max_norm/layer9": 26.38273811340332, + "mean_norm": 10.515074729919434, + "mean_norm/layer0": 10.08557814359665, + "mean_norm/layer1": 10.01053923368454, + "mean_norm/layer10": 10.367479145526886, + "mean_norm/layer11": 10.652198612689972, + "mean_norm/layer12": 11.130778849124908, + "mean_norm/layer13": 10.348851323127747, + "mean_norm/layer14": 10.71534115076065, + "mean_norm/layer15": 11.00808185338974, + "mean_norm/layer16": 10.435614585876465, + "mean_norm/layer17": 10.897213876247406, + "mean_norm/layer18": 10.484766364097595, + "mean_norm/layer19": 10.527069389820099, + "mean_norm/layer2": 8.796098411083221, + "mean_norm/layer20": 10.636413216590881, + "mean_norm/layer21": 10.592262923717499, + "mean_norm/layer22": 11.493712186813354, + "mean_norm/layer23": 11.440210998058319, + "mean_norm/layer3": 10.916420876979828, + "mean_norm/layer4": 9.86082011461258, + "mean_norm/layer5": 12.011876881122589, + "mean_norm/layer6": 9.425954461097717, + "mean_norm/layer7": 9.901139974594116, + "mean_norm/layer8": 10.343375980854034, + "mean_norm/layer9": 10.27999496459961, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 8650 + }, + { + "epoch": 3.61, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46609313588299, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7121775150299072, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.9234, + "eval_samples_per_second": 20.212, + "eval_steps_per_second": 0.671, + "step": 8650 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.63, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5695, + "max_norm": 31.358867645263672, + "max_norm/layer0": 24.205951690673828, + "max_norm/layer1": 25.37681770324707, + "max_norm/layer10": 27.143234252929688, + "max_norm/layer11": 25.367061614990234, + "max_norm/layer12": 27.863758087158203, + "max_norm/layer13": 24.005512237548828, + "max_norm/layer14": 25.879533767700195, + "max_norm/layer15": 30.467557907104492, + "max_norm/layer16": 25.646121978759766, + "max_norm/layer17": 30.41017723083496, + "max_norm/layer18": 26.787418365478516, + "max_norm/layer19": 26.29683494567871, + "max_norm/layer2": 20.221500396728516, + "max_norm/layer20": 27.37459945678711, + "max_norm/layer21": 26.828081130981445, + "max_norm/layer22": 27.710824966430664, + "max_norm/layer23": 26.605989456176758, + "max_norm/layer3": 24.92000961303711, + "max_norm/layer4": 24.675378799438477, + "max_norm/layer5": 31.358867645263672, + "max_norm/layer6": 21.21007537841797, + "max_norm/layer7": 26.560998916625977, + "max_norm/layer8": 26.642372131347656, + "max_norm/layer9": 26.490453720092773, + "mean_norm": 10.525502522786459, + "mean_norm/layer0": 10.09764415025711, + "mean_norm/layer1": 10.020213961601257, + "mean_norm/layer10": 10.37711900472641, + "mean_norm/layer11": 10.662993669509888, + "mean_norm/layer12": 11.144181966781616, + "mean_norm/layer13": 10.35890543460846, + "mean_norm/layer14": 10.726293087005615, + "mean_norm/layer15": 11.02056634426117, + "mean_norm/layer16": 10.445514619350433, + "mean_norm/layer17": 10.908413589000702, + "mean_norm/layer18": 10.49404126405716, + "mean_norm/layer19": 10.536761999130249, + "mean_norm/layer2": 8.7996466755867, + "mean_norm/layer20": 10.646133005619049, + "mean_norm/layer21": 10.602025330066681, + "mean_norm/layer22": 11.50708258152008, + "mean_norm/layer23": 11.453619003295898, + "mean_norm/layer3": 10.929427862167358, + "mean_norm/layer4": 9.868574559688568, + "mean_norm/layer5": 12.029329001903534, + "mean_norm/layer6": 9.431976199150085, + "mean_norm/layer7": 9.909065783023834, + "mean_norm/layer8": 10.353107631206512, + "mean_norm/layer9": 10.289423823356628, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 8700 + }, + { + "epoch": 3.63, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46699358732553753, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.709040403366089, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.923, + "eval_samples_per_second": 20.213, + "eval_steps_per_second": 0.671, + "step": 8700 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.65, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5743, + "max_norm": 31.462026596069336, + "max_norm/layer0": 24.306140899658203, + "max_norm/layer1": 25.461463928222656, + "max_norm/layer10": 27.22161865234375, + "max_norm/layer11": 25.44947624206543, + "max_norm/layer12": 27.968080520629883, + "max_norm/layer13": 24.1011905670166, + "max_norm/layer14": 25.971227645874023, + "max_norm/layer15": 30.586713790893555, + "max_norm/layer16": 25.736255645751953, + "max_norm/layer17": 30.536222457885742, + "max_norm/layer18": 26.88282585144043, + "max_norm/layer19": 26.426443099975586, + "max_norm/layer2": 20.280811309814453, + "max_norm/layer20": 27.453838348388672, + "max_norm/layer21": 26.928016662597656, + "max_norm/layer22": 27.80914306640625, + "max_norm/layer23": 26.693340301513672, + "max_norm/layer3": 24.99188804626465, + "max_norm/layer4": 24.771135330200195, + "max_norm/layer5": 31.462026596069336, + "max_norm/layer6": 21.271432876586914, + "max_norm/layer7": 26.657981872558594, + "max_norm/layer8": 26.73614501953125, + "max_norm/layer9": 26.60494613647461, + "mean_norm": 10.53589997192224, + "mean_norm/layer0": 10.109680235385895, + "mean_norm/layer1": 10.029725313186646, + "mean_norm/layer10": 10.386717557907104, + "mean_norm/layer11": 10.673824787139893, + "mean_norm/layer12": 11.15762722492218, + "mean_norm/layer13": 10.36895900964737, + "mean_norm/layer14": 10.7372505068779, + "mean_norm/layer15": 11.032996237277985, + "mean_norm/layer16": 10.455421268939972, + "mean_norm/layer17": 10.91942673921585, + "mean_norm/layer18": 10.503340184688568, + "mean_norm/layer19": 10.546266198158264, + "mean_norm/layer2": 8.803168833255768, + "mean_norm/layer20": 10.655834794044495, + "mean_norm/layer21": 10.611751914024353, + "mean_norm/layer22": 11.520513951778412, + "mean_norm/layer23": 11.466938018798828, + "mean_norm/layer3": 10.942326188087463, + "mean_norm/layer4": 9.876272022724152, + "mean_norm/layer5": 12.046761870384216, + "mean_norm/layer6": 9.438043534755707, + "mean_norm/layer7": 9.917055368423462, + "mean_norm/layer8": 10.362797379493713, + "mean_norm/layer9": 10.298900187015533, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 8750 + }, + { + "epoch": 3.65, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4673708034703885, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7044708728790283, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8474, + "eval_samples_per_second": 20.342, + "eval_steps_per_second": 0.675, + "step": 8750 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.67, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5789, + "max_norm": 31.572891235351562, + "max_norm/layer0": 24.410261154174805, + "max_norm/layer1": 25.558263778686523, + "max_norm/layer10": 27.304840087890625, + "max_norm/layer11": 25.51268196105957, + "max_norm/layer12": 28.05234146118164, + "max_norm/layer13": 24.20308494567871, + "max_norm/layer14": 26.0477352142334, + "max_norm/layer15": 30.70371437072754, + "max_norm/layer16": 25.83902931213379, + "max_norm/layer17": 30.648099899291992, + "max_norm/layer18": 27.012645721435547, + "max_norm/layer19": 26.52737808227539, + "max_norm/layer2": 20.334718704223633, + "max_norm/layer20": 27.539426803588867, + "max_norm/layer21": 27.018211364746094, + "max_norm/layer22": 27.9110107421875, + "max_norm/layer23": 26.7803955078125, + "max_norm/layer3": 25.054349899291992, + "max_norm/layer4": 24.855287551879883, + "max_norm/layer5": 31.572891235351562, + "max_norm/layer6": 21.333072662353516, + "max_norm/layer7": 26.76139259338379, + "max_norm/layer8": 26.838417053222656, + "max_norm/layer9": 26.697357177734375, + "mean_norm": 10.5463310405612, + "mean_norm/layer0": 10.121755361557007, + "mean_norm/layer1": 10.039315283298492, + "mean_norm/layer10": 10.396234333515167, + "mean_norm/layer11": 10.684642255306244, + "mean_norm/layer12": 11.171061992645264, + "mean_norm/layer13": 10.37897139787674, + "mean_norm/layer14": 10.748344361782074, + "mean_norm/layer15": 11.045448780059814, + "mean_norm/layer16": 10.465394139289856, + "mean_norm/layer17": 10.930562853813171, + "mean_norm/layer18": 10.512667119503021, + "mean_norm/layer19": 10.55586314201355, + "mean_norm/layer2": 8.806701242923737, + "mean_norm/layer20": 10.665653467178345, + "mean_norm/layer21": 10.621645450592041, + "mean_norm/layer22": 11.533875703811646, + "mean_norm/layer23": 11.480299174785614, + "mean_norm/layer3": 10.955307066440582, + "mean_norm/layer4": 9.88407689332962, + "mean_norm/layer5": 12.064229130744934, + "mean_norm/layer6": 9.444064617156982, + "mean_norm/layer7": 9.92504996061325, + "mean_norm/layer8": 10.372445940971375, + "mean_norm/layer9": 10.308335304260254, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 8800 + }, + { + "epoch": 3.67, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4667907829465854, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7064690589904785, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.587, + "eval_samples_per_second": 20.799, + "eval_steps_per_second": 0.69, + "step": 8800 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.7, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5744, + "max_norm": 31.6871337890625, + "max_norm/layer0": 24.510038375854492, + "max_norm/layer1": 25.655925750732422, + "max_norm/layer10": 27.37701988220215, + "max_norm/layer11": 25.585721969604492, + "max_norm/layer12": 28.144187927246094, + "max_norm/layer13": 24.291133880615234, + "max_norm/layer14": 26.127349853515625, + "max_norm/layer15": 30.831226348876953, + "max_norm/layer16": 25.930320739746094, + "max_norm/layer17": 30.755409240722656, + "max_norm/layer18": 27.11887550354004, + "max_norm/layer19": 26.618364334106445, + "max_norm/layer2": 20.38463020324707, + "max_norm/layer20": 27.650087356567383, + "max_norm/layer21": 27.109182357788086, + "max_norm/layer22": 28.00884437561035, + "max_norm/layer23": 26.86437225341797, + "max_norm/layer3": 25.138376235961914, + "max_norm/layer4": 24.935468673706055, + "max_norm/layer5": 31.6871337890625, + "max_norm/layer6": 21.40496253967285, + "max_norm/layer7": 26.854114532470703, + "max_norm/layer8": 26.91637420654297, + "max_norm/layer9": 26.789180755615234, + "mean_norm": 10.556625217199326, + "mean_norm/layer0": 10.13366448879242, + "mean_norm/layer1": 10.048774302005768, + "mean_norm/layer10": 10.405665278434753, + "mean_norm/layer11": 10.695261061191559, + "mean_norm/layer12": 11.184338688850403, + "mean_norm/layer13": 10.388884425163269, + "mean_norm/layer14": 10.759207367897034, + "mean_norm/layer15": 11.05769032239914, + "mean_norm/layer16": 10.475219130516052, + "mean_norm/layer17": 10.94150424003601, + "mean_norm/layer18": 10.5219966173172, + "mean_norm/layer19": 10.565406024456024, + "mean_norm/layer2": 8.810097455978394, + "mean_norm/layer20": 10.675190091133118, + "mean_norm/layer21": 10.631307899951935, + "mean_norm/layer22": 11.547064244747162, + "mean_norm/layer23": 11.493385910987854, + "mean_norm/layer3": 10.968357741832733, + "mean_norm/layer4": 9.891835868358612, + "mean_norm/layer5": 12.081561923027039, + "mean_norm/layer6": 9.449971437454224, + "mean_norm/layer7": 9.932962834835052, + "mean_norm/layer8": 10.38201367855072, + "mean_norm/layer9": 10.31764417886734, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 8850 + }, + { + "epoch": 3.7, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46575242452635035, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7084460258483887, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 10.8044, + "eval_samples_per_second": 22.306, + "eval_steps_per_second": 0.74, + "step": 8850 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.72, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5773, + "max_norm": 31.805294036865234, + "max_norm/layer0": 24.599546432495117, + "max_norm/layer1": 25.76319122314453, + "max_norm/layer10": 27.449440002441406, + "max_norm/layer11": 25.655227661132812, + "max_norm/layer12": 28.233400344848633, + "max_norm/layer13": 24.394102096557617, + "max_norm/layer14": 26.187408447265625, + "max_norm/layer15": 30.92896270751953, + "max_norm/layer16": 26.01325035095215, + "max_norm/layer17": 30.859031677246094, + "max_norm/layer18": 27.204809188842773, + "max_norm/layer19": 26.70510482788086, + "max_norm/layer2": 20.445926666259766, + "max_norm/layer20": 27.740930557250977, + "max_norm/layer21": 27.208942413330078, + "max_norm/layer22": 28.095291137695312, + "max_norm/layer23": 26.942819595336914, + "max_norm/layer3": 25.220661163330078, + "max_norm/layer4": 25.003028869628906, + "max_norm/layer5": 31.805294036865234, + "max_norm/layer6": 21.47049903869629, + "max_norm/layer7": 26.94700813293457, + "max_norm/layer8": 27.007118225097656, + "max_norm/layer9": 26.882286071777344, + "mean_norm": 10.566929931441942, + "mean_norm/layer0": 10.145540177822113, + "mean_norm/layer1": 10.058104574680328, + "mean_norm/layer10": 10.41511994600296, + "mean_norm/layer11": 10.705998122692108, + "mean_norm/layer12": 11.197706997394562, + "mean_norm/layer13": 10.398730218410492, + "mean_norm/layer14": 10.770055413246155, + "mean_norm/layer15": 11.06999284029007, + "mean_norm/layer16": 10.485083758831024, + "mean_norm/layer17": 10.9524467587471, + "mean_norm/layer18": 10.53134435415268, + "mean_norm/layer19": 10.57489550113678, + "mean_norm/layer2": 8.813579618930817, + "mean_norm/layer20": 10.684813797473907, + "mean_norm/layer21": 10.640975952148438, + "mean_norm/layer22": 11.560323774814606, + "mean_norm/layer23": 11.50652539730072, + "mean_norm/layer3": 10.9813032746315, + "mean_norm/layer4": 9.899572908878326, + "mean_norm/layer5": 12.098863184452057, + "mean_norm/layer6": 9.455974757671356, + "mean_norm/layer7": 9.940803170204163, + "mean_norm/layer8": 10.391590774059296, + "mean_norm/layer9": 10.32697308063507, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 8900 + }, + { + "epoch": 3.72, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46607691153267383, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.708861827850342, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8238, + "eval_samples_per_second": 20.383, + "eval_steps_per_second": 0.677, + "step": 8900 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.74, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5772, + "max_norm": 31.916152954101562, + "max_norm/layer0": 24.676496505737305, + "max_norm/layer1": 25.85756492614746, + "max_norm/layer10": 27.528053283691406, + "max_norm/layer11": 25.73573112487793, + "max_norm/layer12": 28.318124771118164, + "max_norm/layer13": 24.479642868041992, + "max_norm/layer14": 26.248197555541992, + "max_norm/layer15": 31.052705764770508, + "max_norm/layer16": 26.09161376953125, + "max_norm/layer17": 30.966751098632812, + "max_norm/layer18": 27.3068790435791, + "max_norm/layer19": 26.7965145111084, + "max_norm/layer2": 20.522724151611328, + "max_norm/layer20": 27.823123931884766, + "max_norm/layer21": 27.323970794677734, + "max_norm/layer22": 28.17957878112793, + "max_norm/layer23": 27.034547805786133, + "max_norm/layer3": 25.299671173095703, + "max_norm/layer4": 25.082792282104492, + "max_norm/layer5": 31.916152954101562, + "max_norm/layer6": 21.534683227539062, + "max_norm/layer7": 27.028034210205078, + "max_norm/layer8": 27.088815689086914, + "max_norm/layer9": 26.969919204711914, + "mean_norm": 10.577225059270859, + "mean_norm/layer0": 10.157378554344177, + "mean_norm/layer1": 10.067561268806458, + "mean_norm/layer10": 10.424581110477448, + "mean_norm/layer11": 10.716570019721985, + "mean_norm/layer12": 11.210873186588287, + "mean_norm/layer13": 10.408523380756378, + "mean_norm/layer14": 10.78095543384552, + "mean_norm/layer15": 11.082448303699493, + "mean_norm/layer16": 10.494913518428802, + "mean_norm/layer17": 10.963443398475647, + "mean_norm/layer18": 10.540624141693115, + "mean_norm/layer19": 10.584456026554108, + "mean_norm/layer2": 8.81709498167038, + "mean_norm/layer20": 10.694341719150543, + "mean_norm/layer21": 10.650606751441956, + "mean_norm/layer22": 11.573448956012726, + "mean_norm/layer23": 11.51974767446518, + "mean_norm/layer3": 10.994216620922089, + "mean_norm/layer4": 9.90748655796051, + "mean_norm/layer5": 12.11613380908966, + "mean_norm/layer6": 9.461788892745972, + "mean_norm/layer7": 9.948690056800842, + "mean_norm/layer8": 10.401232063770294, + "mean_norm/layer9": 10.33628499507904, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 8950 + }, + { + "epoch": 3.74, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4669814190628004, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7066380977630615, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8434, + "eval_samples_per_second": 20.349, + "eval_steps_per_second": 0.675, + "step": 8950 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.76, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5866, + "max_norm": 32.025630950927734, + "max_norm/layer0": 24.762939453125, + "max_norm/layer1": 25.960861206054688, + "max_norm/layer10": 27.613296508789062, + "max_norm/layer11": 25.807106018066406, + "max_norm/layer12": 28.428152084350586, + "max_norm/layer13": 24.579200744628906, + "max_norm/layer14": 26.320199966430664, + "max_norm/layer15": 31.175045013427734, + "max_norm/layer16": 26.178552627563477, + "max_norm/layer17": 31.0894832611084, + "max_norm/layer18": 27.412567138671875, + "max_norm/layer19": 26.8818359375, + "max_norm/layer2": 20.595802307128906, + "max_norm/layer20": 27.916038513183594, + "max_norm/layer21": 27.415224075317383, + "max_norm/layer22": 28.27640151977539, + "max_norm/layer23": 27.122173309326172, + "max_norm/layer3": 25.38041877746582, + "max_norm/layer4": 25.15086555480957, + "max_norm/layer5": 32.025630950927734, + "max_norm/layer6": 21.594274520874023, + "max_norm/layer7": 27.11809730529785, + "max_norm/layer8": 27.185285568237305, + "max_norm/layer9": 27.044723510742188, + "mean_norm": 10.587412876387438, + "mean_norm/layer0": 10.168988108634949, + "mean_norm/layer1": 10.076943039894104, + "mean_norm/layer10": 10.433831512928009, + "mean_norm/layer11": 10.72713315486908, + "mean_norm/layer12": 11.22397780418396, + "mean_norm/layer13": 10.418285012245178, + "mean_norm/layer14": 10.791641414165497, + "mean_norm/layer15": 11.094760477542877, + "mean_norm/layer16": 10.504680275917053, + "mean_norm/layer17": 10.974333047866821, + "mean_norm/layer18": 10.549786627292633, + "mean_norm/layer19": 10.594055414199829, + "mean_norm/layer2": 8.820539593696594, + "mean_norm/layer20": 10.703791201114655, + "mean_norm/layer21": 10.660218596458435, + "mean_norm/layer22": 11.586527645587921, + "mean_norm/layer23": 11.532706141471863, + "mean_norm/layer3": 11.007036626338959, + "mean_norm/layer4": 9.915196359157562, + "mean_norm/layer5": 12.133186936378479, + "mean_norm/layer6": 9.467587530612946, + "mean_norm/layer7": 9.95652425289154, + "mean_norm/layer8": 10.41076546907425, + "mean_norm/layer9": 10.345412790775299, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 9000 + }, + { + "epoch": 3.76, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46787375833018985, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7035961151123047, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8396, + "eval_samples_per_second": 20.355, + "eval_steps_per_second": 0.676, + "step": 9000 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.78, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5766, + "max_norm": 32.134735107421875, + "max_norm/layer0": 24.84881019592285, + "max_norm/layer1": 26.05401611328125, + "max_norm/layer10": 27.689804077148438, + "max_norm/layer11": 25.87973976135254, + "max_norm/layer12": 28.52071762084961, + "max_norm/layer13": 24.691492080688477, + "max_norm/layer14": 26.403806686401367, + "max_norm/layer15": 31.284221649169922, + "max_norm/layer16": 26.256942749023438, + "max_norm/layer17": 31.221664428710938, + "max_norm/layer18": 27.5086612701416, + "max_norm/layer19": 26.977436065673828, + "max_norm/layer2": 20.662620544433594, + "max_norm/layer20": 28.005910873413086, + "max_norm/layer21": 27.506736755371094, + "max_norm/layer22": 28.381319046020508, + "max_norm/layer23": 27.205909729003906, + "max_norm/layer3": 25.46193504333496, + "max_norm/layer4": 25.2278995513916, + "max_norm/layer5": 32.134735107421875, + "max_norm/layer6": 21.648170471191406, + "max_norm/layer7": 27.21436309814453, + "max_norm/layer8": 27.268877029418945, + "max_norm/layer9": 27.110942840576172, + "mean_norm": 10.597499750554562, + "mean_norm/layer0": 10.180612981319427, + "mean_norm/layer1": 10.086312234401703, + "mean_norm/layer10": 10.443076193332672, + "mean_norm/layer11": 10.737610340118408, + "mean_norm/layer12": 11.236975133419037, + "mean_norm/layer13": 10.427858173847198, + "mean_norm/layer14": 10.802227020263672, + "mean_norm/layer15": 11.106768071651459, + "mean_norm/layer16": 10.514285862445831, + "mean_norm/layer17": 10.985120475292206, + "mean_norm/layer18": 10.558781325817108, + "mean_norm/layer19": 10.603352129459381, + "mean_norm/layer2": 8.823948740959167, + "mean_norm/layer20": 10.713205635547638, + "mean_norm/layer21": 10.66967099905014, + "mean_norm/layer22": 11.59945923089981, + "mean_norm/layer23": 11.545632243156433, + "mean_norm/layer3": 11.019707977771759, + "mean_norm/layer4": 9.9228515625, + "mean_norm/layer5": 12.150153994560242, + "mean_norm/layer6": 9.473384976387024, + "mean_norm/layer7": 9.96427607536316, + "mean_norm/layer8": 10.420209109783173, + "mean_norm/layer9": 10.35451352596283, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 9050 + }, + { + "epoch": 3.78, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46858357365652237, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7019236087799072, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8097, + "eval_samples_per_second": 20.407, + "eval_steps_per_second": 0.677, + "step": 9050 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.8, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5811, + "max_norm": 32.24896240234375, + "max_norm/layer0": 24.925283432006836, + "max_norm/layer1": 26.151309967041016, + "max_norm/layer10": 27.78043556213379, + "max_norm/layer11": 25.97683334350586, + "max_norm/layer12": 28.626747131347656, + "max_norm/layer13": 24.789648056030273, + "max_norm/layer14": 26.49995231628418, + "max_norm/layer15": 31.411869049072266, + "max_norm/layer16": 26.331775665283203, + "max_norm/layer17": 31.348556518554688, + "max_norm/layer18": 27.602380752563477, + "max_norm/layer19": 27.07625389099121, + "max_norm/layer2": 20.733642578125, + "max_norm/layer20": 28.101778030395508, + "max_norm/layer21": 27.597261428833008, + "max_norm/layer22": 28.473896026611328, + "max_norm/layer23": 27.283172607421875, + "max_norm/layer3": 25.54083251953125, + "max_norm/layer4": 25.305072784423828, + "max_norm/layer5": 32.24896240234375, + "max_norm/layer6": 21.698518753051758, + "max_norm/layer7": 27.31633758544922, + "max_norm/layer8": 27.362085342407227, + "max_norm/layer9": 27.174236297607422, + "mean_norm": 10.60761951158444, + "mean_norm/layer0": 10.192138016223907, + "mean_norm/layer1": 10.095690608024597, + "mean_norm/layer10": 10.45243376493454, + "mean_norm/layer11": 10.748098969459534, + "mean_norm/layer12": 11.250001728534698, + "mean_norm/layer13": 10.4375701546669, + "mean_norm/layer14": 10.812869429588318, + "mean_norm/layer15": 11.118857681751251, + "mean_norm/layer16": 10.523910284042358, + "mean_norm/layer17": 10.995957911014557, + "mean_norm/layer18": 10.567832112312317, + "mean_norm/layer19": 10.61269599199295, + "mean_norm/layer2": 8.82736986875534, + "mean_norm/layer20": 10.722554564476013, + "mean_norm/layer21": 10.679236650466919, + "mean_norm/layer22": 11.612319529056549, + "mean_norm/layer23": 11.558498978614807, + "mean_norm/layer3": 11.032294690608978, + "mean_norm/layer4": 9.93044263124466, + "mean_norm/layer5": 12.167267978191376, + "mean_norm/layer6": 9.479266583919525, + "mean_norm/layer7": 9.972204864025116, + "mean_norm/layer8": 10.429711878299713, + "mean_norm/layer9": 10.363643407821655, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 9100 + }, + { + "epoch": 3.8, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4681252357600905, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.6967613697052, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8279, + "eval_samples_per_second": 20.376, + "eval_steps_per_second": 0.676, + "step": 9100 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.82, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5825, + "max_norm": 32.35498046875, + "max_norm/layer0": 25.00909996032715, + "max_norm/layer1": 26.24652862548828, + "max_norm/layer10": 27.876937866210938, + "max_norm/layer11": 26.062362670898438, + "max_norm/layer12": 28.732330322265625, + "max_norm/layer13": 24.885143280029297, + "max_norm/layer14": 26.589519500732422, + "max_norm/layer15": 31.518461227416992, + "max_norm/layer16": 26.398515701293945, + "max_norm/layer17": 31.479341506958008, + "max_norm/layer18": 27.692447662353516, + "max_norm/layer19": 27.19039535522461, + "max_norm/layer2": 20.811538696289062, + "max_norm/layer20": 28.179485321044922, + "max_norm/layer21": 27.66974639892578, + "max_norm/layer22": 28.55803108215332, + "max_norm/layer23": 27.369035720825195, + "max_norm/layer3": 25.627965927124023, + "max_norm/layer4": 25.377857208251953, + "max_norm/layer5": 32.35498046875, + "max_norm/layer6": 21.744564056396484, + "max_norm/layer7": 27.417688369750977, + "max_norm/layer8": 27.45230484008789, + "max_norm/layer9": 27.24327278137207, + "mean_norm": 10.617767485479513, + "mean_norm/layer0": 10.20370638370514, + "mean_norm/layer1": 10.105073094367981, + "mean_norm/layer10": 10.461777687072754, + "mean_norm/layer11": 10.758564233779907, + "mean_norm/layer12": 11.263149619102478, + "mean_norm/layer13": 10.447303175926208, + "mean_norm/layer14": 10.823521196842194, + "mean_norm/layer15": 11.131090462207794, + "mean_norm/layer16": 10.533623218536377, + "mean_norm/layer17": 11.006788909435272, + "mean_norm/layer18": 10.576985120773315, + "mean_norm/layer19": 10.621982991695404, + "mean_norm/layer2": 8.830790042877197, + "mean_norm/layer20": 10.73173063993454, + "mean_norm/layer21": 10.688687920570374, + "mean_norm/layer22": 11.625361859798431, + "mean_norm/layer23": 11.57146829366684, + "mean_norm/layer3": 11.044941544532776, + "mean_norm/layer4": 9.938095211982727, + "mean_norm/layer5": 12.18439656496048, + "mean_norm/layer6": 9.485150754451752, + "mean_norm/layer7": 9.980055332183838, + "mean_norm/layer8": 10.43933492898941, + "mean_norm/layer9": 10.372840464115143, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 9150 + }, + { + "epoch": 3.82, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4689972945895848, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.69665265083313, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8286, + "eval_samples_per_second": 20.374, + "eval_steps_per_second": 0.676, + "step": 9150 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.84, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.58, + "max_norm": 32.470787048339844, + "max_norm/layer0": 25.096399307250977, + "max_norm/layer1": 26.337860107421875, + "max_norm/layer10": 27.961523056030273, + "max_norm/layer11": 26.16880989074707, + "max_norm/layer12": 28.851654052734375, + "max_norm/layer13": 24.98517608642578, + "max_norm/layer14": 26.683137893676758, + "max_norm/layer15": 31.63360023498535, + "max_norm/layer16": 26.46404457092285, + "max_norm/layer17": 31.591623306274414, + "max_norm/layer18": 27.78776741027832, + "max_norm/layer19": 27.291912078857422, + "max_norm/layer2": 20.879919052124023, + "max_norm/layer20": 28.259227752685547, + "max_norm/layer21": 27.76218605041504, + "max_norm/layer22": 28.638896942138672, + "max_norm/layer23": 27.45287322998047, + "max_norm/layer3": 25.71695899963379, + "max_norm/layer4": 25.455402374267578, + "max_norm/layer5": 32.470787048339844, + "max_norm/layer6": 21.793964385986328, + "max_norm/layer7": 27.533058166503906, + "max_norm/layer8": 27.53644561767578, + "max_norm/layer9": 27.302696228027344, + "mean_norm": 10.627832487225533, + "mean_norm/layer0": 10.215189158916473, + "mean_norm/layer1": 10.114474654197693, + "mean_norm/layer10": 10.471054553985596, + "mean_norm/layer11": 10.768976330757141, + "mean_norm/layer12": 11.276058495044708, + "mean_norm/layer13": 10.456969678401947, + "mean_norm/layer14": 10.834083795547485, + "mean_norm/layer15": 11.143160045146942, + "mean_norm/layer16": 10.543258905410767, + "mean_norm/layer17": 11.017536640167236, + "mean_norm/layer18": 10.586021959781647, + "mean_norm/layer19": 10.631254851818085, + "mean_norm/layer2": 8.834143280982971, + "mean_norm/layer20": 10.741076946258545, + "mean_norm/layer21": 10.698038101196289, + "mean_norm/layer22": 11.63832575082779, + "mean_norm/layer23": 11.584293246269226, + "mean_norm/layer3": 11.057526648044586, + "mean_norm/layer4": 9.945752322673798, + "mean_norm/layer5": 12.201387524604797, + "mean_norm/layer6": 9.490907371044159, + "mean_norm/layer7": 9.987753689289093, + "mean_norm/layer8": 10.448831021785736, + "mean_norm/layer9": 10.38190472126007, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 9200 + }, + { + "epoch": 3.84, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4678656461550318, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.699800729751587, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6274, + "eval_samples_per_second": 20.727, + "eval_steps_per_second": 0.688, + "step": 9200 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.86, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5811, + "max_norm": 32.58055877685547, + "max_norm/layer0": 25.184913635253906, + "max_norm/layer1": 26.429561614990234, + "max_norm/layer10": 28.046606063842773, + "max_norm/layer11": 26.280040740966797, + "max_norm/layer12": 28.957191467285156, + "max_norm/layer13": 25.079774856567383, + "max_norm/layer14": 26.769201278686523, + "max_norm/layer15": 31.73074722290039, + "max_norm/layer16": 26.54261589050293, + "max_norm/layer17": 31.711532592773438, + "max_norm/layer18": 27.88140869140625, + "max_norm/layer19": 27.393001556396484, + "max_norm/layer2": 20.94183921813965, + "max_norm/layer20": 28.350820541381836, + "max_norm/layer21": 27.87078285217285, + "max_norm/layer22": 28.729032516479492, + "max_norm/layer23": 27.542428970336914, + "max_norm/layer3": 25.806852340698242, + "max_norm/layer4": 25.527923583984375, + "max_norm/layer5": 32.58055877685547, + "max_norm/layer6": 21.839183807373047, + "max_norm/layer7": 27.622976303100586, + "max_norm/layer8": 27.621929168701172, + "max_norm/layer9": 27.380239486694336, + "mean_norm": 10.637928095956644, + "mean_norm/layer0": 10.226729273796082, + "mean_norm/layer1": 10.123919010162354, + "mean_norm/layer10": 10.480370283126831, + "mean_norm/layer11": 10.779435157775879, + "mean_norm/layer12": 11.289127767086029, + "mean_norm/layer13": 10.466708064079285, + "mean_norm/layer14": 10.844647407531738, + "mean_norm/layer15": 11.155323445796967, + "mean_norm/layer16": 10.55289614200592, + "mean_norm/layer17": 11.028343617916107, + "mean_norm/layer18": 10.595082998275757, + "mean_norm/layer19": 10.640502452850342, + "mean_norm/layer2": 8.8375204205513, + "mean_norm/layer20": 10.750492691993713, + "mean_norm/layer21": 10.707438945770264, + "mean_norm/layer22": 11.651351392269135, + "mean_norm/layer23": 11.597171068191528, + "mean_norm/layer3": 11.070042908191681, + "mean_norm/layer4": 9.953387081623077, + "mean_norm/layer5": 12.218364238739014, + "mean_norm/layer6": 9.496791005134583, + "mean_norm/layer7": 9.995419442653656, + "mean_norm/layer8": 10.458230197429657, + "mean_norm/layer9": 10.390979290008545, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 9250 + }, + { + "epoch": 3.86, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46845783494157206, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.69732403755188, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 10.7995, + "eval_samples_per_second": 22.316, + "eval_steps_per_second": 0.741, + "step": 9250 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.88, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5798, + "max_norm": 32.68303298950195, + "max_norm/layer0": 25.272388458251953, + "max_norm/layer1": 26.51814079284668, + "max_norm/layer10": 28.143573760986328, + "max_norm/layer11": 26.36440658569336, + "max_norm/layer12": 29.06740379333496, + "max_norm/layer13": 25.197477340698242, + "max_norm/layer14": 26.863147735595703, + "max_norm/layer15": 31.821640014648438, + "max_norm/layer16": 26.632102966308594, + "max_norm/layer17": 31.83808708190918, + "max_norm/layer18": 27.988380432128906, + "max_norm/layer19": 27.489473342895508, + "max_norm/layer2": 21.011850357055664, + "max_norm/layer20": 28.4365291595459, + "max_norm/layer21": 27.981365203857422, + "max_norm/layer22": 28.814743041992188, + "max_norm/layer23": 27.636215209960938, + "max_norm/layer3": 25.881065368652344, + "max_norm/layer4": 25.616458892822266, + "max_norm/layer5": 32.68303298950195, + "max_norm/layer6": 21.897836685180664, + "max_norm/layer7": 27.713808059692383, + "max_norm/layer8": 27.703105926513672, + "max_norm/layer9": 27.458404541015625, + "mean_norm": 10.647937004764875, + "mean_norm/layer0": 10.238056540489197, + "mean_norm/layer1": 10.133143305778503, + "mean_norm/layer10": 10.489564597606659, + "mean_norm/layer11": 10.789824903011322, + "mean_norm/layer12": 11.302159667015076, + "mean_norm/layer13": 10.476322174072266, + "mean_norm/layer14": 10.855113446712494, + "mean_norm/layer15": 11.167461931705475, + "mean_norm/layer16": 10.562495648860931, + "mean_norm/layer17": 11.03900271654129, + "mean_norm/layer18": 10.604086875915527, + "mean_norm/layer19": 10.649737179279327, + "mean_norm/layer2": 8.840841054916382, + "mean_norm/layer20": 10.759805142879486, + "mean_norm/layer21": 10.716701686382294, + "mean_norm/layer22": 11.664154350757599, + "mean_norm/layer23": 11.609936714172363, + "mean_norm/layer3": 11.082544147968292, + "mean_norm/layer4": 9.9610356092453, + "mean_norm/layer5": 12.235257029533386, + "mean_norm/layer6": 9.502565085887909, + "mean_norm/layer7": 10.003019213676453, + "mean_norm/layer8": 10.467623889446259, + "mean_norm/layer9": 10.400035202503204, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 9300 + }, + { + "epoch": 3.88, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46830775970114746, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7002856731414795, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 10.8184, + "eval_samples_per_second": 22.277, + "eval_steps_per_second": 0.739, + "step": 9300 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.9, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5664, + "max_norm": 32.782840728759766, + "max_norm/layer0": 25.365907669067383, + "max_norm/layer1": 26.609689712524414, + "max_norm/layer10": 28.237533569335938, + "max_norm/layer11": 26.454559326171875, + "max_norm/layer12": 29.165164947509766, + "max_norm/layer13": 25.313295364379883, + "max_norm/layer14": 26.973520278930664, + "max_norm/layer15": 31.91727066040039, + "max_norm/layer16": 26.71632194519043, + "max_norm/layer17": 31.9581241607666, + "max_norm/layer18": 28.106477737426758, + "max_norm/layer19": 27.586517333984375, + "max_norm/layer2": 21.090667724609375, + "max_norm/layer20": 28.518213272094727, + "max_norm/layer21": 28.0922794342041, + "max_norm/layer22": 28.909934997558594, + "max_norm/layer23": 27.714889526367188, + "max_norm/layer3": 25.95438575744629, + "max_norm/layer4": 25.699705123901367, + "max_norm/layer5": 32.782840728759766, + "max_norm/layer6": 21.94924545288086, + "max_norm/layer7": 27.81015968322754, + "max_norm/layer8": 27.77658462524414, + "max_norm/layer9": 27.53354835510254, + "mean_norm": 10.658011309802532, + "mean_norm/layer0": 10.24942147731781, + "mean_norm/layer1": 10.14245593547821, + "mean_norm/layer10": 10.498845994472504, + "mean_norm/layer11": 10.800289332866669, + "mean_norm/layer12": 11.315202176570892, + "mean_norm/layer13": 10.485957622528076, + "mean_norm/layer14": 10.865731239318848, + "mean_norm/layer15": 11.179639279842377, + "mean_norm/layer16": 10.572109937667847, + "mean_norm/layer17": 11.049724102020264, + "mean_norm/layer18": 10.613103151321411, + "mean_norm/layer19": 10.658956408500671, + "mean_norm/layer2": 8.844276249408722, + "mean_norm/layer20": 10.769253730773926, + "mean_norm/layer21": 10.72613674402237, + "mean_norm/layer22": 11.676981389522552, + "mean_norm/layer23": 11.622842133045197, + "mean_norm/layer3": 11.095019221305847, + "mean_norm/layer4": 9.96867686510086, + "mean_norm/layer5": 12.25225579738617, + "mean_norm/layer6": 9.508372902870178, + "mean_norm/layer7": 10.010667264461517, + "mean_norm/layer8": 10.477143466472626, + "mean_norm/layer9": 10.40920901298523, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 9350 + }, + { + "epoch": 3.9, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4693461181213825, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.6948671340942383, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8372, + "eval_samples_per_second": 20.36, + "eval_steps_per_second": 0.676, + "step": 9350 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.92, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5755, + "max_norm": 32.886863708496094, + "max_norm/layer0": 25.44892120361328, + "max_norm/layer1": 26.69940757751465, + "max_norm/layer10": 28.33182144165039, + "max_norm/layer11": 26.536706924438477, + "max_norm/layer12": 29.27495002746582, + "max_norm/layer13": 25.407133102416992, + "max_norm/layer14": 27.068056106567383, + "max_norm/layer15": 32.01877975463867, + "max_norm/layer16": 26.809919357299805, + "max_norm/layer17": 32.068660736083984, + "max_norm/layer18": 28.212785720825195, + "max_norm/layer19": 27.692922592163086, + "max_norm/layer2": 21.16015625, + "max_norm/layer20": 28.613033294677734, + "max_norm/layer21": 28.182695388793945, + "max_norm/layer22": 29.009483337402344, + "max_norm/layer23": 27.800437927246094, + "max_norm/layer3": 26.028907775878906, + "max_norm/layer4": 25.79058837890625, + "max_norm/layer5": 32.886863708496094, + "max_norm/layer6": 22.01177978515625, + "max_norm/layer7": 27.899147033691406, + "max_norm/layer8": 27.851360321044922, + "max_norm/layer9": 27.61525535583496, + "mean_norm": 10.668005446592966, + "mean_norm/layer0": 10.260759949684143, + "mean_norm/layer1": 10.15172153711319, + "mean_norm/layer10": 10.508157014846802, + "mean_norm/layer11": 10.810645937919617, + "mean_norm/layer12": 11.328147649765015, + "mean_norm/layer13": 10.495525300502777, + "mean_norm/layer14": 10.876251876354218, + "mean_norm/layer15": 11.191632449626923, + "mean_norm/layer16": 10.58162671327591, + "mean_norm/layer17": 11.06039971113205, + "mean_norm/layer18": 10.622076153755188, + "mean_norm/layer19": 10.668111145496368, + "mean_norm/layer2": 8.847656607627869, + "mean_norm/layer20": 10.778528094291687, + "mean_norm/layer21": 10.735529243946075, + "mean_norm/layer22": 11.689706325531006, + "mean_norm/layer23": 11.635596692562103, + "mean_norm/layer3": 11.107528388500214, + "mean_norm/layer4": 9.976164162158966, + "mean_norm/layer5": 12.269051373004913, + "mean_norm/layer6": 9.51415604352951, + "mean_norm/layer7": 10.01818311214447, + "mean_norm/layer8": 10.486587703227997, + "mean_norm/layer9": 10.418387532234192, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 9400 + }, + { + "epoch": 3.92, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4681495722855648, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.6942684650421143, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6432, + "eval_samples_per_second": 20.699, + "eval_steps_per_second": 0.687, + "step": 9400 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.95, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.573, + "max_norm": 33.00111389160156, + "max_norm/layer0": 25.53734016418457, + "max_norm/layer1": 26.78814125061035, + "max_norm/layer10": 28.42632293701172, + "max_norm/layer11": 26.61481475830078, + "max_norm/layer12": 29.382888793945312, + "max_norm/layer13": 25.50127601623535, + "max_norm/layer14": 27.171720504760742, + "max_norm/layer15": 32.12615966796875, + "max_norm/layer16": 26.910057067871094, + "max_norm/layer17": 32.16920852661133, + "max_norm/layer18": 28.307641983032227, + "max_norm/layer19": 27.791166305541992, + "max_norm/layer2": 21.225391387939453, + "max_norm/layer20": 28.681900024414062, + "max_norm/layer21": 28.29361915588379, + "max_norm/layer22": 29.12259292602539, + "max_norm/layer23": 27.881290435791016, + "max_norm/layer3": 26.104650497436523, + "max_norm/layer4": 25.875703811645508, + "max_norm/layer5": 33.00111389160156, + "max_norm/layer6": 22.065937042236328, + "max_norm/layer7": 28.001384735107422, + "max_norm/layer8": 27.930898666381836, + "max_norm/layer9": 27.698144912719727, + "mean_norm": 10.67796295384566, + "mean_norm/layer0": 10.27203243970871, + "mean_norm/layer1": 10.161053121089935, + "mean_norm/layer10": 10.51726907491684, + "mean_norm/layer11": 10.820999085903168, + "mean_norm/layer12": 11.341056287288666, + "mean_norm/layer13": 10.505224525928497, + "mean_norm/layer14": 10.886779367923737, + "mean_norm/layer15": 11.20365023612976, + "mean_norm/layer16": 10.591172337532043, + "mean_norm/layer17": 11.071096956729889, + "mean_norm/layer18": 10.631023526191711, + "mean_norm/layer19": 10.677245795726776, + "mean_norm/layer2": 8.850984394550323, + "mean_norm/layer20": 10.787645399570465, + "mean_norm/layer21": 10.744815289974213, + "mean_norm/layer22": 11.702471911907196, + "mean_norm/layer23": 11.648136258125305, + "mean_norm/layer3": 11.11998337507248, + "mean_norm/layer4": 9.983684122562408, + "mean_norm/layer5": 12.285788357257843, + "mean_norm/layer6": 9.519932866096497, + "mean_norm/layer7": 10.02573847770691, + "mean_norm/layer8": 10.495937168598175, + "mean_norm/layer9": 10.42739051580429, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 9450 + }, + { + "epoch": 3.95, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4690256872026381, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.6952497959136963, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.846, + "eval_samples_per_second": 20.344, + "eval_steps_per_second": 0.675, + "step": 9450 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.97, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5826, + "max_norm": 33.11233139038086, + "max_norm/layer0": 25.61636734008789, + "max_norm/layer1": 26.879316329956055, + "max_norm/layer10": 28.511680603027344, + "max_norm/layer11": 26.70820426940918, + "max_norm/layer12": 29.474576950073242, + "max_norm/layer13": 25.595924377441406, + "max_norm/layer14": 27.25803565979004, + "max_norm/layer15": 32.24443817138672, + "max_norm/layer16": 27.010766983032227, + "max_norm/layer17": 32.268558502197266, + "max_norm/layer18": 28.439178466796875, + "max_norm/layer19": 27.8987979888916, + "max_norm/layer2": 21.282726287841797, + "max_norm/layer20": 28.772045135498047, + "max_norm/layer21": 28.373287200927734, + "max_norm/layer22": 29.23287010192871, + "max_norm/layer23": 27.96897315979004, + "max_norm/layer3": 26.182008743286133, + "max_norm/layer4": 25.959827423095703, + "max_norm/layer5": 33.11233139038086, + "max_norm/layer6": 22.129119873046875, + "max_norm/layer7": 28.099084854125977, + "max_norm/layer8": 28.009950637817383, + "max_norm/layer9": 27.775909423828125, + "mean_norm": 10.688044652342796, + "mean_norm/layer0": 10.283402860164642, + "mean_norm/layer1": 10.17039829492569, + "mean_norm/layer10": 10.52660220861435, + "mean_norm/layer11": 10.831436216831207, + "mean_norm/layer12": 11.354080498218536, + "mean_norm/layer13": 10.514998495578766, + "mean_norm/layer14": 10.89742910861969, + "mean_norm/layer15": 11.215672731399536, + "mean_norm/layer16": 10.600797593593597, + "mean_norm/layer17": 11.081857025623322, + "mean_norm/layer18": 10.640068292617798, + "mean_norm/layer19": 10.686591744422913, + "mean_norm/layer2": 8.854361951351166, + "mean_norm/layer20": 10.796972274780273, + "mean_norm/layer21": 10.754287958145142, + "mean_norm/layer22": 11.71543425321579, + "mean_norm/layer23": 11.660886287689209, + "mean_norm/layer3": 11.13255774974823, + "mean_norm/layer4": 9.991296291351318, + "mean_norm/layer5": 12.302757441997528, + "mean_norm/layer6": 9.525744915008545, + "mean_norm/layer7": 10.033455848693848, + "mean_norm/layer8": 10.505375623703003, + "mean_norm/layer9": 10.436605989933014, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 9500 + }, + { + "epoch": 3.97, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46980445601781434, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.6896309852600098, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6117, + "eval_samples_per_second": 20.755, + "eval_steps_per_second": 0.689, + "step": 9500 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 3.99, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5845, + "max_norm": 33.22111511230469, + "max_norm/layer0": 25.70020866394043, + "max_norm/layer1": 26.959239959716797, + "max_norm/layer10": 28.604167938232422, + "max_norm/layer11": 26.803647994995117, + "max_norm/layer12": 29.598041534423828, + "max_norm/layer13": 25.70684051513672, + "max_norm/layer14": 27.33949851989746, + "max_norm/layer15": 32.35847473144531, + "max_norm/layer16": 27.094337463378906, + "max_norm/layer17": 32.37206268310547, + "max_norm/layer18": 28.551963806152344, + "max_norm/layer19": 28.00347900390625, + "max_norm/layer2": 21.350160598754883, + "max_norm/layer20": 28.8660888671875, + "max_norm/layer21": 28.463394165039062, + "max_norm/layer22": 29.33779525756836, + "max_norm/layer23": 28.057477951049805, + "max_norm/layer3": 26.272552490234375, + "max_norm/layer4": 26.05592155456543, + "max_norm/layer5": 33.22111511230469, + "max_norm/layer6": 22.20157814025879, + "max_norm/layer7": 28.201513290405273, + "max_norm/layer8": 28.098514556884766, + "max_norm/layer9": 27.844715118408203, + "mean_norm": 10.698029942810535, + "mean_norm/layer0": 10.294709742069244, + "mean_norm/layer1": 10.179706275463104, + "mean_norm/layer10": 10.535793900489807, + "mean_norm/layer11": 10.841690242290497, + "mean_norm/layer12": 11.367003858089447, + "mean_norm/layer13": 10.524603307247162, + "mean_norm/layer14": 10.90799218416214, + "mean_norm/layer15": 11.227812469005585, + "mean_norm/layer16": 10.610308766365051, + "mean_norm/layer17": 11.092499136924744, + "mean_norm/layer18": 10.648983716964722, + "mean_norm/layer19": 10.695793569087982, + "mean_norm/layer2": 8.85766851902008, + "mean_norm/layer20": 10.806212484836578, + "mean_norm/layer21": 10.76362019777298, + "mean_norm/layer22": 11.728101670742035, + "mean_norm/layer23": 11.673562049865723, + "mean_norm/layer3": 11.145098149776459, + "mean_norm/layer4": 9.99885606765747, + "mean_norm/layer5": 12.319611668586731, + "mean_norm/layer6": 9.53151524066925, + "mean_norm/layer7": 10.041094720363617, + "mean_norm/layer8": 10.514805734157562, + "mean_norm/layer9": 10.44567495584488, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 9550 + }, + { + "epoch": 3.99, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4687012001963146, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.6940293312072754, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8271, + "eval_samples_per_second": 20.377, + "eval_steps_per_second": 0.676, + "step": 9550 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.01, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5008, + "max_norm": 33.330360412597656, + "max_norm/layer0": 25.78761100769043, + "max_norm/layer1": 27.03449821472168, + "max_norm/layer10": 28.674245834350586, + "max_norm/layer11": 26.880537033081055, + "max_norm/layer12": 29.694679260253906, + "max_norm/layer13": 25.82834243774414, + "max_norm/layer14": 27.425241470336914, + "max_norm/layer15": 32.486995697021484, + "max_norm/layer16": 27.171628952026367, + "max_norm/layer17": 32.492279052734375, + "max_norm/layer18": 28.64808464050293, + "max_norm/layer19": 28.095623016357422, + "max_norm/layer2": 21.42145347595215, + "max_norm/layer20": 28.951364517211914, + "max_norm/layer21": 28.559009552001953, + "max_norm/layer22": 29.44493865966797, + "max_norm/layer23": 28.142528533935547, + "max_norm/layer3": 26.364864349365234, + "max_norm/layer4": 26.138946533203125, + "max_norm/layer5": 33.330360412597656, + "max_norm/layer6": 22.253427505493164, + "max_norm/layer7": 28.289306640625, + "max_norm/layer8": 28.16522789001465, + "max_norm/layer9": 27.91402244567871, + "mean_norm": 10.707975409924984, + "mean_norm/layer0": 10.30594515800476, + "mean_norm/layer1": 10.188912451267242, + "mean_norm/layer10": 10.544912993907928, + "mean_norm/layer11": 10.851902425289154, + "mean_norm/layer12": 11.379847884178162, + "mean_norm/layer13": 10.534163355827332, + "mean_norm/layer14": 10.918485581874847, + "mean_norm/layer15": 11.239793062210083, + "mean_norm/layer16": 10.619805216789246, + "mean_norm/layer17": 11.103209257125854, + "mean_norm/layer18": 10.657873153686523, + "mean_norm/layer19": 10.705002188682556, + "mean_norm/layer2": 8.860992550849915, + "mean_norm/layer20": 10.81546437740326, + "mean_norm/layer21": 10.773070752620697, + "mean_norm/layer22": 11.740694344043732, + "mean_norm/layer23": 11.686245620250702, + "mean_norm/layer3": 11.157555222511292, + "mean_norm/layer4": 10.006467998027802, + "mean_norm/layer5": 12.33630108833313, + "mean_norm/layer6": 9.53725254535675, + "mean_norm/layer7": 10.04867398738861, + "mean_norm/layer8": 10.52416044473648, + "mean_norm/layer9": 10.454678177833557, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 9600 + }, + { + "epoch": 4.01, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46611747240846424, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.72489857673645, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5754, + "eval_samples_per_second": 20.82, + "eval_steps_per_second": 0.691, + "step": 9600 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.03, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.3794, + "max_norm": 33.43217468261719, + "max_norm/layer0": 25.877573013305664, + "max_norm/layer1": 27.117990493774414, + "max_norm/layer10": 28.741506576538086, + "max_norm/layer11": 26.964374542236328, + "max_norm/layer12": 29.798730850219727, + "max_norm/layer13": 25.944913864135742, + "max_norm/layer14": 27.508432388305664, + "max_norm/layer15": 32.604679107666016, + "max_norm/layer16": 27.249217987060547, + "max_norm/layer17": 32.60658645629883, + "max_norm/layer18": 28.736671447753906, + "max_norm/layer19": 28.200363159179688, + "max_norm/layer2": 21.477174758911133, + "max_norm/layer20": 29.063146591186523, + "max_norm/layer21": 28.660245895385742, + "max_norm/layer22": 29.5419979095459, + "max_norm/layer23": 28.22159767150879, + "max_norm/layer3": 26.45147705078125, + "max_norm/layer4": 26.22504425048828, + "max_norm/layer5": 33.43217468261719, + "max_norm/layer6": 22.306541442871094, + "max_norm/layer7": 28.394588470458984, + "max_norm/layer8": 28.237964630126953, + "max_norm/layer9": 28.015945434570312, + "mean_norm": 10.718371979892254, + "mean_norm/layer0": 10.31786572933197, + "mean_norm/layer1": 10.19822359085083, + "mean_norm/layer10": 10.554284036159515, + "mean_norm/layer11": 10.862599432468414, + "mean_norm/layer12": 11.393266081809998, + "mean_norm/layer13": 10.544181823730469, + "mean_norm/layer14": 10.929447948932648, + "mean_norm/layer15": 11.252337992191315, + "mean_norm/layer16": 10.629814624786377, + "mean_norm/layer17": 11.114417672157288, + "mean_norm/layer18": 10.667439937591553, + "mean_norm/layer19": 10.715016543865204, + "mean_norm/layer2": 8.864496111869812, + "mean_norm/layer20": 10.825547099113464, + "mean_norm/layer21": 10.783361256122589, + "mean_norm/layer22": 11.753725469112396, + "mean_norm/layer23": 11.699581742286682, + "mean_norm/layer3": 11.170176565647125, + "mean_norm/layer4": 10.014464855194092, + "mean_norm/layer5": 12.353192925453186, + "mean_norm/layer6": 9.543238639831543, + "mean_norm/layer7": 10.056542873382568, + "mean_norm/layer8": 10.533743023872375, + "mean_norm/layer9": 10.46396154165268, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 9650 + }, + { + "epoch": 4.03, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4661945380724661, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7255403995513916, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8304, + "eval_samples_per_second": 20.371, + "eval_steps_per_second": 0.676, + "step": 9650 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.05, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4052, + "max_norm": 33.544166564941406, + "max_norm/layer0": 25.971208572387695, + "max_norm/layer1": 27.212482452392578, + "max_norm/layer10": 28.805835723876953, + "max_norm/layer11": 27.037063598632812, + "max_norm/layer12": 29.901081085205078, + "max_norm/layer13": 26.061325073242188, + "max_norm/layer14": 27.592479705810547, + "max_norm/layer15": 32.70225143432617, + "max_norm/layer16": 27.345638275146484, + "max_norm/layer17": 32.72298812866211, + "max_norm/layer18": 28.8302059173584, + "max_norm/layer19": 28.301692962646484, + "max_norm/layer2": 21.534664154052734, + "max_norm/layer20": 29.158594131469727, + "max_norm/layer21": 28.769094467163086, + "max_norm/layer22": 29.628246307373047, + "max_norm/layer23": 28.29683494567871, + "max_norm/layer3": 26.550901412963867, + "max_norm/layer4": 26.31060791015625, + "max_norm/layer5": 33.544166564941406, + "max_norm/layer6": 22.365896224975586, + "max_norm/layer7": 28.48600959777832, + "max_norm/layer8": 28.317893981933594, + "max_norm/layer9": 28.098060607910156, + "mean_norm": 10.72877743591865, + "mean_norm/layer0": 10.33024138212204, + "mean_norm/layer1": 10.20755660533905, + "mean_norm/layer10": 10.56365418434143, + "mean_norm/layer11": 10.873272597789764, + "mean_norm/layer12": 11.406682074069977, + "mean_norm/layer13": 10.554228723049164, + "mean_norm/layer14": 10.94050520658493, + "mean_norm/layer15": 11.2648805975914, + "mean_norm/layer16": 10.639814674854279, + "mean_norm/layer17": 11.125602781772614, + "mean_norm/layer18": 10.67691570520401, + "mean_norm/layer19": 10.724987506866455, + "mean_norm/layer2": 8.8680060505867, + "mean_norm/layer20": 10.835620880126953, + "mean_norm/layer21": 10.793499529361725, + "mean_norm/layer22": 11.766671538352966, + "mean_norm/layer23": 11.71286165714264, + "mean_norm/layer3": 11.1830073595047, + "mean_norm/layer4": 10.02237868309021, + "mean_norm/layer5": 12.3701092004776, + "mean_norm/layer6": 9.549232542514801, + "mean_norm/layer7": 10.064398467540741, + "mean_norm/layer8": 10.54334545135498, + "mean_norm/layer9": 10.473185062408447, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 9700 + }, + { + "epoch": 4.05, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46593089237982827, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7316884994506836, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8212, + "eval_samples_per_second": 20.387, + "eval_steps_per_second": 0.677, + "step": 9700 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.07, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4048, + "max_norm": 33.6557731628418, + "max_norm/layer0": 26.066650390625, + "max_norm/layer1": 27.306856155395508, + "max_norm/layer10": 28.87506675720215, + "max_norm/layer11": 27.117992401123047, + "max_norm/layer12": 30.010032653808594, + "max_norm/layer13": 26.163286209106445, + "max_norm/layer14": 27.68418312072754, + "max_norm/layer15": 32.824462890625, + "max_norm/layer16": 27.442707061767578, + "max_norm/layer17": 32.84294128417969, + "max_norm/layer18": 28.918869018554688, + "max_norm/layer19": 28.40460205078125, + "max_norm/layer2": 21.58877182006836, + "max_norm/layer20": 29.261137008666992, + "max_norm/layer21": 28.882108688354492, + "max_norm/layer22": 29.714868545532227, + "max_norm/layer23": 28.384431838989258, + "max_norm/layer3": 26.648792266845703, + "max_norm/layer4": 26.3952693939209, + "max_norm/layer5": 33.6557731628418, + "max_norm/layer6": 22.42438316345215, + "max_norm/layer7": 28.574481964111328, + "max_norm/layer8": 28.396562576293945, + "max_norm/layer9": 28.194005966186523, + "mean_norm": 10.739245263238749, + "mean_norm/layer0": 10.34294319152832, + "mean_norm/layer1": 10.216990768909454, + "mean_norm/layer10": 10.573124587535858, + "mean_norm/layer11": 10.884048283100128, + "mean_norm/layer12": 11.420178711414337, + "mean_norm/layer13": 10.56421959400177, + "mean_norm/layer14": 10.95153260231018, + "mean_norm/layer15": 11.277423799037933, + "mean_norm/layer16": 10.649728536605835, + "mean_norm/layer17": 11.136787831783295, + "mean_norm/layer18": 10.686513543128967, + "mean_norm/layer19": 10.735000014305115, + "mean_norm/layer2": 8.871544182300568, + "mean_norm/layer20": 10.845619082450867, + "mean_norm/layer21": 10.803569555282593, + "mean_norm/layer22": 11.779800772666931, + "mean_norm/layer23": 11.72627604007721, + "mean_norm/layer3": 11.19598013162613, + "mean_norm/layer4": 10.030231535434723, + "mean_norm/layer5": 12.387197315692902, + "mean_norm/layer6": 9.555224657058716, + "mean_norm/layer7": 10.072312891483307, + "mean_norm/layer8": 10.552999079227448, + "mean_norm/layer9": 10.482639610767365, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 9750 + }, + { + "epoch": 4.07, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4651399553019149, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.731163501739502, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6326, + "eval_samples_per_second": 20.718, + "eval_steps_per_second": 0.688, + "step": 9750 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.09, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.431, + "max_norm": 33.754417419433594, + "max_norm/layer0": 26.159645080566406, + "max_norm/layer1": 27.404632568359375, + "max_norm/layer10": 28.946714401245117, + "max_norm/layer11": 27.202007293701172, + "max_norm/layer12": 30.121065139770508, + "max_norm/layer13": 26.25760841369629, + "max_norm/layer14": 27.78693389892578, + "max_norm/layer15": 32.94147872924805, + "max_norm/layer16": 27.53252601623535, + "max_norm/layer17": 32.94584274291992, + "max_norm/layer18": 29.010591506958008, + "max_norm/layer19": 28.501497268676758, + "max_norm/layer2": 21.647987365722656, + "max_norm/layer20": 29.359277725219727, + "max_norm/layer21": 28.98589515686035, + "max_norm/layer22": 29.815181732177734, + "max_norm/layer23": 28.46575927734375, + "max_norm/layer3": 26.744037628173828, + "max_norm/layer4": 26.49158477783203, + "max_norm/layer5": 33.754417419433594, + "max_norm/layer6": 22.48211097717285, + "max_norm/layer7": 28.680606842041016, + "max_norm/layer8": 28.470558166503906, + "max_norm/layer9": 28.30710220336914, + "mean_norm": 10.749750765661398, + "mean_norm/layer0": 10.355877697467804, + "mean_norm/layer1": 10.226464807987213, + "mean_norm/layer10": 10.582582950592041, + "mean_norm/layer11": 10.894802331924438, + "mean_norm/layer12": 11.433715283870697, + "mean_norm/layer13": 10.574375629425049, + "mean_norm/layer14": 10.96265333890915, + "mean_norm/layer15": 11.29006689786911, + "mean_norm/layer16": 10.659694969654083, + "mean_norm/layer17": 11.147985517978668, + "mean_norm/layer18": 10.696076333522797, + "mean_norm/layer19": 10.744998633861542, + "mean_norm/layer2": 8.87516975402832, + "mean_norm/layer20": 10.855427503585815, + "mean_norm/layer21": 10.813684225082397, + "mean_norm/layer22": 11.792862176895142, + "mean_norm/layer23": 11.739510834217072, + "mean_norm/layer3": 11.209203958511353, + "mean_norm/layer4": 10.038220882415771, + "mean_norm/layer5": 12.404386818408966, + "mean_norm/layer6": 9.561310589313507, + "mean_norm/layer7": 10.080223083496094, + "mean_norm/layer8": 10.56266450881958, + "mean_norm/layer9": 10.492059648036957, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 9800 + }, + { + "epoch": 4.09, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4648844217844352, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.733736276626587, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8593, + "eval_samples_per_second": 20.322, + "eval_steps_per_second": 0.675, + "step": 9800 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.11, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4228, + "max_norm": 33.861244201660156, + "max_norm/layer0": 26.24639320373535, + "max_norm/layer1": 27.48942756652832, + "max_norm/layer10": 29.03034019470215, + "max_norm/layer11": 27.291231155395508, + "max_norm/layer12": 30.230600357055664, + "max_norm/layer13": 26.365447998046875, + "max_norm/layer14": 27.9014835357666, + "max_norm/layer15": 33.083675384521484, + "max_norm/layer16": 27.63498878479004, + "max_norm/layer17": 33.05691909790039, + "max_norm/layer18": 29.120906829833984, + "max_norm/layer19": 28.622779846191406, + "max_norm/layer2": 21.700437545776367, + "max_norm/layer20": 29.4544734954834, + "max_norm/layer21": 29.081451416015625, + "max_norm/layer22": 29.90110206604004, + "max_norm/layer23": 28.563703536987305, + "max_norm/layer3": 26.82892417907715, + "max_norm/layer4": 26.564434051513672, + "max_norm/layer5": 33.861244201660156, + "max_norm/layer6": 22.549427032470703, + "max_norm/layer7": 28.77765655517578, + "max_norm/layer8": 28.5548152923584, + "max_norm/layer9": 28.40509605407715, + "mean_norm": 10.760287982722124, + "mean_norm/layer0": 10.368937730789185, + "mean_norm/layer1": 10.236066102981567, + "mean_norm/layer10": 10.592142224311829, + "mean_norm/layer11": 10.905653715133667, + "mean_norm/layer12": 11.44727337360382, + "mean_norm/layer13": 10.584530711174011, + "mean_norm/layer14": 10.973800659179688, + "mean_norm/layer15": 11.30276346206665, + "mean_norm/layer16": 10.669570624828339, + "mean_norm/layer17": 11.159093022346497, + "mean_norm/layer18": 10.705552816390991, + "mean_norm/layer19": 10.755048036575317, + "mean_norm/layer2": 8.878891050815582, + "mean_norm/layer20": 10.865257143974304, + "mean_norm/layer21": 10.82360953092575, + "mean_norm/layer22": 11.805942714214325, + "mean_norm/layer23": 11.752815186977386, + "mean_norm/layer3": 11.2224680185318, + "mean_norm/layer4": 10.046254456043243, + "mean_norm/layer5": 12.421765625476837, + "mean_norm/layer6": 9.567421734333038, + "mean_norm/layer7": 10.08821588754654, + "mean_norm/layer8": 10.572381436824799, + "mean_norm/layer9": 10.501456320285797, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 9850 + }, + { + "epoch": 4.11, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46495743136085793, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.736454963684082, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6254, + "eval_samples_per_second": 20.731, + "eval_steps_per_second": 0.688, + "step": 9850 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.13, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4248, + "max_norm": 33.9556770324707, + "max_norm/layer0": 26.33261489868164, + "max_norm/layer1": 27.56793785095215, + "max_norm/layer10": 29.119720458984375, + "max_norm/layer11": 27.357046127319336, + "max_norm/layer12": 30.328794479370117, + "max_norm/layer13": 26.464094161987305, + "max_norm/layer14": 28.015090942382812, + "max_norm/layer15": 33.20350646972656, + "max_norm/layer16": 27.721712112426758, + "max_norm/layer17": 33.16472244262695, + "max_norm/layer18": 29.199329376220703, + "max_norm/layer19": 28.717470169067383, + "max_norm/layer2": 21.774988174438477, + "max_norm/layer20": 29.529516220092773, + "max_norm/layer21": 29.168851852416992, + "max_norm/layer22": 29.998376846313477, + "max_norm/layer23": 28.664161682128906, + "max_norm/layer3": 26.9122371673584, + "max_norm/layer4": 26.651660919189453, + "max_norm/layer5": 33.9556770324707, + "max_norm/layer6": 22.61054801940918, + "max_norm/layer7": 28.86550521850586, + "max_norm/layer8": 28.6397705078125, + "max_norm/layer9": 28.507871627807617, + "mean_norm": 10.770872302353382, + "mean_norm/layer0": 10.382256388664246, + "mean_norm/layer1": 10.245670199394226, + "mean_norm/layer10": 10.601735293865204, + "mean_norm/layer11": 10.916560173034668, + "mean_norm/layer12": 11.46084600687027, + "mean_norm/layer13": 10.594715774059296, + "mean_norm/layer14": 10.984999299049377, + "mean_norm/layer15": 11.315381169319153, + "mean_norm/layer16": 10.679502785205841, + "mean_norm/layer17": 11.17024689912796, + "mean_norm/layer18": 10.714980006217957, + "mean_norm/layer19": 10.764934778213501, + "mean_norm/layer2": 8.882648348808289, + "mean_norm/layer20": 10.875350773334503, + "mean_norm/layer21": 10.833550810813904, + "mean_norm/layer22": 11.81899881362915, + "mean_norm/layer23": 11.766067922115326, + "mean_norm/layer3": 11.235760807991028, + "mean_norm/layer4": 10.05432653427124, + "mean_norm/layer5": 12.439239859580994, + "mean_norm/layer6": 9.573659777641296, + "mean_norm/layer7": 10.096255362033844, + "mean_norm/layer8": 10.582192361354828, + "mean_norm/layer9": 10.51105511188507, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 9900 + }, + { + "epoch": 4.13, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4645396543402165, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7372591495513916, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6883, + "eval_samples_per_second": 20.619, + "eval_steps_per_second": 0.684, + "step": 9900 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.15, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4436, + "max_norm": 34.049339294433594, + "max_norm/layer0": 26.419641494750977, + "max_norm/layer1": 27.664649963378906, + "max_norm/layer10": 29.210588455200195, + "max_norm/layer11": 27.431074142456055, + "max_norm/layer12": 30.43071937561035, + "max_norm/layer13": 26.566423416137695, + "max_norm/layer14": 28.112030029296875, + "max_norm/layer15": 33.33354187011719, + "max_norm/layer16": 27.804418563842773, + "max_norm/layer17": 33.27605438232422, + "max_norm/layer18": 29.307640075683594, + "max_norm/layer19": 28.8117733001709, + "max_norm/layer2": 21.834720611572266, + "max_norm/layer20": 29.619890213012695, + "max_norm/layer21": 29.266197204589844, + "max_norm/layer22": 30.08498764038086, + "max_norm/layer23": 28.764848709106445, + "max_norm/layer3": 26.997285842895508, + "max_norm/layer4": 26.735742568969727, + "max_norm/layer5": 34.049339294433594, + "max_norm/layer6": 22.67427635192871, + "max_norm/layer7": 28.954214096069336, + "max_norm/layer8": 28.72142791748047, + "max_norm/layer9": 28.615943908691406, + "mean_norm": 10.781430753568808, + "mean_norm/layer0": 10.395660698413849, + "mean_norm/layer1": 10.255378246307373, + "mean_norm/layer10": 10.61120194196701, + "mean_norm/layer11": 10.9274360537529, + "mean_norm/layer12": 11.474487781524658, + "mean_norm/layer13": 10.604840219020844, + "mean_norm/layer14": 10.996111154556274, + "mean_norm/layer15": 11.328039467334747, + "mean_norm/layer16": 10.689521372318268, + "mean_norm/layer17": 11.181367576122284, + "mean_norm/layer18": 10.724294066429138, + "mean_norm/layer19": 10.774694919586182, + "mean_norm/layer2": 8.886360824108124, + "mean_norm/layer20": 10.885128438472748, + "mean_norm/layer21": 10.843543469905853, + "mean_norm/layer22": 11.83205932378769, + "mean_norm/layer23": 11.779264986515045, + "mean_norm/layer3": 11.249089777469635, + "mean_norm/layer4": 10.062511086463928, + "mean_norm/layer5": 12.456778228282928, + "mean_norm/layer6": 9.579894959926605, + "mean_norm/layer7": 10.104304015636444, + "mean_norm/layer8": 10.59186977148056, + "mean_norm/layer9": 10.52049970626831, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 9950 + }, + { + "epoch": 4.15, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4647992439452753, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7321929931640625, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5663, + "eval_samples_per_second": 20.836, + "eval_steps_per_second": 0.692, + "step": 9950 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.18, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4491, + "max_norm": 34.14283752441406, + "max_norm/layer0": 26.50551986694336, + "max_norm/layer1": 27.7550106048584, + "max_norm/layer10": 29.307462692260742, + "max_norm/layer11": 27.49453353881836, + "max_norm/layer12": 30.52471160888672, + "max_norm/layer13": 26.660375595092773, + "max_norm/layer14": 28.200090408325195, + "max_norm/layer15": 33.45909881591797, + "max_norm/layer16": 27.896703720092773, + "max_norm/layer17": 33.38733673095703, + "max_norm/layer18": 29.413230895996094, + "max_norm/layer19": 28.905559539794922, + "max_norm/layer2": 21.893877029418945, + "max_norm/layer20": 29.715972900390625, + "max_norm/layer21": 29.35295867919922, + "max_norm/layer22": 30.175220489501953, + "max_norm/layer23": 28.85986328125, + "max_norm/layer3": 27.073829650878906, + "max_norm/layer4": 26.81964683532715, + "max_norm/layer5": 34.14283752441406, + "max_norm/layer6": 22.7307071685791, + "max_norm/layer7": 29.045549392700195, + "max_norm/layer8": 28.79771614074707, + "max_norm/layer9": 28.713727951049805, + "mean_norm": 10.791931385795275, + "mean_norm/layer0": 10.409155309200287, + "mean_norm/layer1": 10.2649627327919, + "mean_norm/layer10": 10.620647609233856, + "mean_norm/layer11": 10.938298046588898, + "mean_norm/layer12": 11.488030791282654, + "mean_norm/layer13": 10.61491984128952, + "mean_norm/layer14": 11.007142424583435, + "mean_norm/layer15": 11.340634763240814, + "mean_norm/layer16": 10.699385046958923, + "mean_norm/layer17": 11.192373037338257, + "mean_norm/layer18": 10.733623325824738, + "mean_norm/layer19": 10.784404814243317, + "mean_norm/layer2": 8.890056729316711, + "mean_norm/layer20": 10.89472770690918, + "mean_norm/layer21": 10.853393316268921, + "mean_norm/layer22": 11.845016062259674, + "mean_norm/layer23": 11.792450189590454, + "mean_norm/layer3": 11.262365102767944, + "mean_norm/layer4": 10.070643126964569, + "mean_norm/layer5": 12.47421932220459, + "mean_norm/layer6": 9.5861154794693, + "mean_norm/layer7": 10.112246751785278, + "mean_norm/layer8": 10.601553738117218, + "mean_norm/layer9": 10.52998799085617, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 10000 + }, + { + "epoch": 4.18, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46464105652969256, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7348339557647705, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8228, + "eval_samples_per_second": 20.384, + "eval_steps_per_second": 0.677, + "step": 10000 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.2, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4329, + "max_norm": 34.24258041381836, + "max_norm/layer0": 26.59330177307129, + "max_norm/layer1": 27.850889205932617, + "max_norm/layer10": 29.392183303833008, + "max_norm/layer11": 27.56389808654785, + "max_norm/layer12": 30.620975494384766, + "max_norm/layer13": 26.739151000976562, + "max_norm/layer14": 28.295047760009766, + "max_norm/layer15": 33.56934356689453, + "max_norm/layer16": 27.998239517211914, + "max_norm/layer17": 33.505916595458984, + "max_norm/layer18": 29.517406463623047, + "max_norm/layer19": 29.00499725341797, + "max_norm/layer2": 21.960556030273438, + "max_norm/layer20": 29.809242248535156, + "max_norm/layer21": 29.433250427246094, + "max_norm/layer22": 30.258737564086914, + "max_norm/layer23": 28.964088439941406, + "max_norm/layer3": 27.16298484802246, + "max_norm/layer4": 26.908559799194336, + "max_norm/layer5": 34.24258041381836, + "max_norm/layer6": 22.788379669189453, + "max_norm/layer7": 29.131332397460938, + "max_norm/layer8": 28.89280128479004, + "max_norm/layer9": 28.82826042175293, + "mean_norm": 10.802442769209543, + "mean_norm/layer0": 10.422712087631226, + "mean_norm/layer1": 10.274647951126099, + "mean_norm/layer10": 10.630156993865967, + "mean_norm/layer11": 10.949021577835083, + "mean_norm/layer12": 11.501543462276459, + "mean_norm/layer13": 10.62501984834671, + "mean_norm/layer14": 11.018203675746918, + "mean_norm/layer15": 11.353238582611084, + "mean_norm/layer16": 10.70931327342987, + "mean_norm/layer17": 11.203383982181549, + "mean_norm/layer18": 10.742836117744446, + "mean_norm/layer19": 10.79411780834198, + "mean_norm/layer2": 8.89378023147583, + "mean_norm/layer20": 10.904330492019653, + "mean_norm/layer21": 10.863244533538818, + "mean_norm/layer22": 11.858083486557007, + "mean_norm/layer23": 11.805590689182281, + "mean_norm/layer3": 11.275679171085358, + "mean_norm/layer4": 10.078687965869904, + "mean_norm/layer5": 12.491709351539612, + "mean_norm/layer6": 9.592344641685486, + "mean_norm/layer7": 10.120253562927246, + "mean_norm/layer8": 10.611266136169434, + "mean_norm/layer9": 10.539460837841034, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 10050 + }, + { + "epoch": 4.2, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4653305914181299, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7377023696899414, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8222, + "eval_samples_per_second": 20.385, + "eval_steps_per_second": 0.677, + "step": 10050 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.22, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4418, + "max_norm": 34.33783721923828, + "max_norm/layer0": 26.687532424926758, + "max_norm/layer1": 27.943302154541016, + "max_norm/layer10": 29.47475814819336, + "max_norm/layer11": 27.646385192871094, + "max_norm/layer12": 30.71775245666504, + "max_norm/layer13": 26.815946578979492, + "max_norm/layer14": 28.3834228515625, + "max_norm/layer15": 33.6978874206543, + "max_norm/layer16": 28.076602935791016, + "max_norm/layer17": 33.623817443847656, + "max_norm/layer18": 29.62516975402832, + "max_norm/layer19": 29.10083770751953, + "max_norm/layer2": 22.04039192199707, + "max_norm/layer20": 29.9028377532959, + "max_norm/layer21": 29.55206871032715, + "max_norm/layer22": 30.35678482055664, + "max_norm/layer23": 29.040468215942383, + "max_norm/layer3": 27.252946853637695, + "max_norm/layer4": 26.981002807617188, + "max_norm/layer5": 34.33783721923828, + "max_norm/layer6": 22.85585594177246, + "max_norm/layer7": 29.2227840423584, + "max_norm/layer8": 28.991825103759766, + "max_norm/layer9": 28.919313430786133, + "mean_norm": 10.813075611988703, + "mean_norm/layer0": 10.436362564563751, + "mean_norm/layer1": 10.284512996673584, + "mean_norm/layer10": 10.639845430850983, + "mean_norm/layer11": 10.960028350353241, + "mean_norm/layer12": 11.515252709388733, + "mean_norm/layer13": 10.635209619998932, + "mean_norm/layer14": 11.029352128505707, + "mean_norm/layer15": 11.365962743759155, + "mean_norm/layer16": 10.71934300661087, + "mean_norm/layer17": 11.21452122926712, + "mean_norm/layer18": 10.75224620103836, + "mean_norm/layer19": 10.80382651090622, + "mean_norm/layer2": 8.897547483444214, + "mean_norm/layer20": 10.914192497730255, + "mean_norm/layer21": 10.873103141784668, + "mean_norm/layer22": 11.871187806129456, + "mean_norm/layer23": 11.81886202096939, + "mean_norm/layer3": 11.289128601551056, + "mean_norm/layer4": 10.086705446243286, + "mean_norm/layer5": 12.509444057941437, + "mean_norm/layer6": 9.598621368408203, + "mean_norm/layer7": 10.128449976444244, + "mean_norm/layer8": 10.621142864227295, + "mean_norm/layer9": 10.54896593093872, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 10100 + }, + { + "epoch": 4.22, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46528597445476044, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7357242107391357, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6332, + "eval_samples_per_second": 20.716, + "eval_steps_per_second": 0.688, + "step": 10100 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.24, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4544, + "max_norm": 34.453956604003906, + "max_norm/layer0": 26.772411346435547, + "max_norm/layer1": 28.041337966918945, + "max_norm/layer10": 29.558502197265625, + "max_norm/layer11": 27.715511322021484, + "max_norm/layer12": 30.828214645385742, + "max_norm/layer13": 26.886316299438477, + "max_norm/layer14": 28.47247886657715, + "max_norm/layer15": 33.815494537353516, + "max_norm/layer16": 28.156137466430664, + "max_norm/layer17": 33.7318115234375, + "max_norm/layer18": 29.730388641357422, + "max_norm/layer19": 29.191200256347656, + "max_norm/layer2": 22.100492477416992, + "max_norm/layer20": 29.983238220214844, + "max_norm/layer21": 29.642305374145508, + "max_norm/layer22": 30.443191528320312, + "max_norm/layer23": 29.122554779052734, + "max_norm/layer3": 27.341691970825195, + "max_norm/layer4": 27.058629989624023, + "max_norm/layer5": 34.453956604003906, + "max_norm/layer6": 22.911787033081055, + "max_norm/layer7": 29.31786346435547, + "max_norm/layer8": 29.09516143798828, + "max_norm/layer9": 29.001785278320312, + "mean_norm": 10.823577101031939, + "mean_norm/layer0": 10.449947893619537, + "mean_norm/layer1": 10.294241428375244, + "mean_norm/layer10": 10.649329900741577, + "mean_norm/layer11": 10.97073119878769, + "mean_norm/layer12": 11.528786540031433, + "mean_norm/layer13": 10.64515471458435, + "mean_norm/layer14": 11.040421605110168, + "mean_norm/layer15": 11.378489017486572, + "mean_norm/layer16": 10.729291319847107, + "mean_norm/layer17": 11.22548794746399, + "mean_norm/layer18": 10.761508107185364, + "mean_norm/layer19": 10.813477575778961, + "mean_norm/layer2": 8.90120553970337, + "mean_norm/layer20": 10.923896491527557, + "mean_norm/layer21": 10.882788181304932, + "mean_norm/layer22": 11.884176313877106, + "mean_norm/layer23": 11.831968367099762, + "mean_norm/layer3": 11.302320063114166, + "mean_norm/layer4": 10.094793438911438, + "mean_norm/layer5": 12.52708524465561, + "mean_norm/layer6": 9.604782938957214, + "mean_norm/layer7": 10.136550486087799, + "mean_norm/layer8": 10.630961179733276, + "mean_norm/layer9": 10.558454930782318, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 10150 + }, + { + "epoch": 4.24, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46512778703917773, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7335257530212402, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8291, + "eval_samples_per_second": 20.374, + "eval_steps_per_second": 0.676, + "step": 10150 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.26, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4673, + "max_norm": 34.58348083496094, + "max_norm/layer0": 26.855865478515625, + "max_norm/layer1": 28.143543243408203, + "max_norm/layer10": 29.672481536865234, + "max_norm/layer11": 27.77507781982422, + "max_norm/layer12": 30.940479278564453, + "max_norm/layer13": 26.968402862548828, + "max_norm/layer14": 28.5567684173584, + "max_norm/layer15": 33.94534683227539, + "max_norm/layer16": 28.248029708862305, + "max_norm/layer17": 33.84120559692383, + "max_norm/layer18": 29.839115142822266, + "max_norm/layer19": 29.27945899963379, + "max_norm/layer2": 22.152008056640625, + "max_norm/layer20": 30.0822811126709, + "max_norm/layer21": 29.724666595458984, + "max_norm/layer22": 30.52536392211914, + "max_norm/layer23": 29.206314086914062, + "max_norm/layer3": 27.427833557128906, + "max_norm/layer4": 27.152973175048828, + "max_norm/layer5": 34.58348083496094, + "max_norm/layer6": 22.977237701416016, + "max_norm/layer7": 29.407623291015625, + "max_norm/layer8": 29.18715476989746, + "max_norm/layer9": 29.0870418548584, + "mean_norm": 10.833997232218584, + "mean_norm/layer0": 10.463428616523743, + "mean_norm/layer1": 10.30388629436493, + "mean_norm/layer10": 10.658759415149689, + "mean_norm/layer11": 10.981380045413971, + "mean_norm/layer12": 11.542144119739532, + "mean_norm/layer13": 10.655113756656647, + "mean_norm/layer14": 11.05135828256607, + "mean_norm/layer15": 11.390934586524963, + "mean_norm/layer16": 10.739136815071106, + "mean_norm/layer17": 11.236359000205994, + "mean_norm/layer18": 10.770753979682922, + "mean_norm/layer19": 10.822953343391418, + "mean_norm/layer2": 8.904917061328888, + "mean_norm/layer20": 10.933463454246521, + "mean_norm/layer21": 10.89233547449112, + "mean_norm/layer22": 11.897063732147217, + "mean_norm/layer23": 11.84492552280426, + "mean_norm/layer3": 11.315583348274231, + "mean_norm/layer4": 10.102841198444366, + "mean_norm/layer5": 12.544600367546082, + "mean_norm/layer6": 9.610954105854034, + "mean_norm/layer7": 10.144558072090149, + "mean_norm/layer8": 10.64060389995575, + "mean_norm/layer9": 10.5678790807724, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 10200 + }, + { + "epoch": 4.26, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4655739566728725, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7333078384399414, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8316, + "eval_samples_per_second": 20.369, + "eval_steps_per_second": 0.676, + "step": 10200 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.28, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4621, + "max_norm": 34.71388626098633, + "max_norm/layer0": 26.937944412231445, + "max_norm/layer1": 28.25180435180664, + "max_norm/layer10": 29.777528762817383, + "max_norm/layer11": 27.845121383666992, + "max_norm/layer12": 31.053159713745117, + "max_norm/layer13": 27.057754516601562, + "max_norm/layer14": 28.657506942749023, + "max_norm/layer15": 34.0597038269043, + "max_norm/layer16": 28.338624954223633, + "max_norm/layer17": 33.95635986328125, + "max_norm/layer18": 29.946928024291992, + "max_norm/layer19": 29.373924255371094, + "max_norm/layer2": 22.206056594848633, + "max_norm/layer20": 30.173419952392578, + "max_norm/layer21": 29.83626937866211, + "max_norm/layer22": 30.619873046875, + "max_norm/layer23": 29.289323806762695, + "max_norm/layer3": 27.5142822265625, + "max_norm/layer4": 27.233551025390625, + "max_norm/layer5": 34.71388626098633, + "max_norm/layer6": 23.036663055419922, + "max_norm/layer7": 29.503074645996094, + "max_norm/layer8": 29.276399612426758, + "max_norm/layer9": 29.16158676147461, + "mean_norm": 10.844474345445633, + "mean_norm/layer0": 10.477041006088257, + "mean_norm/layer1": 10.313621699810028, + "mean_norm/layer10": 10.668282330036163, + "mean_norm/layer11": 10.992021024227142, + "mean_norm/layer12": 11.555621325969696, + "mean_norm/layer13": 10.665147244930267, + "mean_norm/layer14": 11.062337279319763, + "mean_norm/layer15": 11.403449833393097, + "mean_norm/layer16": 10.74899560213089, + "mean_norm/layer17": 11.247314095497131, + "mean_norm/layer18": 10.77999460697174, + "mean_norm/layer19": 10.832535803318024, + "mean_norm/layer2": 8.908604800701141, + "mean_norm/layer20": 10.942877173423767, + "mean_norm/layer21": 10.901946604251862, + "mean_norm/layer22": 11.90995740890503, + "mean_norm/layer23": 11.857899725437164, + "mean_norm/layer3": 11.328973352909088, + "mean_norm/layer4": 10.11098599433899, + "mean_norm/layer5": 12.562341749668121, + "mean_norm/layer6": 9.61716765165329, + "mean_norm/layer7": 10.1526557803154, + "mean_norm/layer8": 10.65031635761261, + "mean_norm/layer9": 10.57729583978653, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 10250 + }, + { + "epoch": 4.28, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.466563642042159, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7261102199554443, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6164, + "eval_samples_per_second": 20.747, + "eval_steps_per_second": 0.689, + "step": 10250 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.3, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4588, + "max_norm": 34.85292434692383, + "max_norm/layer0": 27.01976203918457, + "max_norm/layer1": 28.348358154296875, + "max_norm/layer10": 29.854251861572266, + "max_norm/layer11": 27.921520233154297, + "max_norm/layer12": 31.167068481445312, + "max_norm/layer13": 27.163440704345703, + "max_norm/layer14": 28.76555061340332, + "max_norm/layer15": 34.19651412963867, + "max_norm/layer16": 28.430654525756836, + "max_norm/layer17": 34.0618782043457, + "max_norm/layer18": 30.038536071777344, + "max_norm/layer19": 29.47166633605957, + "max_norm/layer2": 22.28195571899414, + "max_norm/layer20": 30.264249801635742, + "max_norm/layer21": 29.946247100830078, + "max_norm/layer22": 30.70496368408203, + "max_norm/layer23": 29.37714195251465, + "max_norm/layer3": 27.59646224975586, + "max_norm/layer4": 27.327890396118164, + "max_norm/layer5": 34.85292434692383, + "max_norm/layer6": 23.106088638305664, + "max_norm/layer7": 29.593017578125, + "max_norm/layer8": 29.365062713623047, + "max_norm/layer9": 29.251405715942383, + "mean_norm": 10.855059415102005, + "mean_norm/layer0": 10.490851998329163, + "mean_norm/layer1": 10.323559045791626, + "mean_norm/layer10": 10.677920937538147, + "mean_norm/layer11": 11.002786934375763, + "mean_norm/layer12": 11.569205522537231, + "mean_norm/layer13": 10.675206542015076, + "mean_norm/layer14": 11.073414862155914, + "mean_norm/layer15": 11.416033565998077, + "mean_norm/layer16": 10.759003520011902, + "mean_norm/layer17": 11.258389592170715, + "mean_norm/layer18": 10.789301872253418, + "mean_norm/layer19": 10.842225074768066, + "mean_norm/layer2": 8.912357330322266, + "mean_norm/layer20": 10.952302515506744, + "mean_norm/layer21": 10.911858797073364, + "mean_norm/layer22": 11.92295503616333, + "mean_norm/layer23": 11.870939314365387, + "mean_norm/layer3": 11.342563092708588, + "mean_norm/layer4": 10.119135022163391, + "mean_norm/layer5": 12.580202519893646, + "mean_norm/layer6": 9.623411118984222, + "mean_norm/layer7": 10.160789787769318, + "mean_norm/layer8": 10.660134971141815, + "mean_norm/layer9": 10.58687698841095, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 10300 + }, + { + "epoch": 4.3, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4662594354737307, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7252895832061768, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.611, + "eval_samples_per_second": 20.756, + "eval_steps_per_second": 0.689, + "step": 10300 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.32, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4687, + "max_norm": 34.978092193603516, + "max_norm/layer0": 27.09325408935547, + "max_norm/layer1": 28.446916580200195, + "max_norm/layer10": 29.938980102539062, + "max_norm/layer11": 27.996728897094727, + "max_norm/layer12": 31.258825302124023, + "max_norm/layer13": 27.261137008666992, + "max_norm/layer14": 28.864126205444336, + "max_norm/layer15": 34.30337905883789, + "max_norm/layer16": 28.527667999267578, + "max_norm/layer17": 34.16838455200195, + "max_norm/layer18": 30.128267288208008, + "max_norm/layer19": 29.572622299194336, + "max_norm/layer2": 22.346477508544922, + "max_norm/layer20": 30.36367416381836, + "max_norm/layer21": 30.041337966918945, + "max_norm/layer22": 30.79248809814453, + "max_norm/layer23": 29.450716018676758, + "max_norm/layer3": 27.676977157592773, + "max_norm/layer4": 27.40702247619629, + "max_norm/layer5": 34.978092193603516, + "max_norm/layer6": 23.169605255126953, + "max_norm/layer7": 29.688037872314453, + "max_norm/layer8": 29.44434928894043, + "max_norm/layer9": 29.350614547729492, + "mean_norm": 10.865495984752974, + "mean_norm/layer0": 10.50440114736557, + "mean_norm/layer1": 10.333391070365906, + "mean_norm/layer10": 10.68735784292221, + "mean_norm/layer11": 11.013559699058533, + "mean_norm/layer12": 11.582540392875671, + "mean_norm/layer13": 10.6851087808609, + "mean_norm/layer14": 11.084410846233368, + "mean_norm/layer15": 11.428485333919525, + "mean_norm/layer16": 10.768832564353943, + "mean_norm/layer17": 11.269369840621948, + "mean_norm/layer18": 10.798486649990082, + "mean_norm/layer19": 10.851684868335724, + "mean_norm/layer2": 8.916000783443451, + "mean_norm/layer20": 10.961656332015991, + "mean_norm/layer21": 10.921466648578644, + "mean_norm/layer22": 11.935903191566467, + "mean_norm/layer23": 11.883876979351044, + "mean_norm/layer3": 11.355989933013916, + "mean_norm/layer4": 10.12704610824585, + "mean_norm/layer5": 12.597833693027496, + "mean_norm/layer6": 9.629578769207, + "mean_norm/layer7": 10.168816149234772, + "mean_norm/layer8": 10.669798731803894, + "mean_norm/layer9": 10.596307277679443, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 10350 + }, + { + "epoch": 4.32, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4666691003192141, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7238152027130127, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.83, + "eval_samples_per_second": 20.372, + "eval_steps_per_second": 0.676, + "step": 10350 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.34, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4675, + "max_norm": 35.09250259399414, + "max_norm/layer0": 27.170841217041016, + "max_norm/layer1": 28.54010009765625, + "max_norm/layer10": 30.02427864074707, + "max_norm/layer11": 28.07108497619629, + "max_norm/layer12": 31.37407684326172, + "max_norm/layer13": 27.350177764892578, + "max_norm/layer14": 28.96674156188965, + "max_norm/layer15": 34.41961669921875, + "max_norm/layer16": 28.634737014770508, + "max_norm/layer17": 34.30854034423828, + "max_norm/layer18": 30.215808868408203, + "max_norm/layer19": 29.66392707824707, + "max_norm/layer2": 22.399484634399414, + "max_norm/layer20": 30.463783264160156, + "max_norm/layer21": 30.12825584411621, + "max_norm/layer22": 30.878080368041992, + "max_norm/layer23": 29.53550910949707, + "max_norm/layer3": 27.760766983032227, + "max_norm/layer4": 27.49215316772461, + "max_norm/layer5": 35.09250259399414, + "max_norm/layer6": 23.237085342407227, + "max_norm/layer7": 29.78689956665039, + "max_norm/layer8": 29.529512405395508, + "max_norm/layer9": 29.437997817993164, + "mean_norm": 10.875869582096735, + "mean_norm/layer0": 10.517846643924713, + "mean_norm/layer1": 10.343126773834229, + "mean_norm/layer10": 10.696803987026215, + "mean_norm/layer11": 11.02418839931488, + "mean_norm/layer12": 11.595861494541168, + "mean_norm/layer13": 10.69503504037857, + "mean_norm/layer14": 11.095302939414978, + "mean_norm/layer15": 11.440791726112366, + "mean_norm/layer16": 10.778616189956665, + "mean_norm/layer17": 11.280155301094055, + "mean_norm/layer18": 10.807569742202759, + "mean_norm/layer19": 10.861127018928528, + "mean_norm/layer2": 8.919726192951202, + "mean_norm/layer20": 10.970995128154755, + "mean_norm/layer21": 10.93109941482544, + "mean_norm/layer22": 11.948687732219696, + "mean_norm/layer23": 11.896688163280487, + "mean_norm/layer3": 11.369346380233765, + "mean_norm/layer4": 10.135048031806946, + "mean_norm/layer5": 12.615287721157074, + "mean_norm/layer6": 9.63567179441452, + "mean_norm/layer7": 10.176795840263367, + "mean_norm/layer8": 10.679445087909698, + "mean_norm/layer9": 10.60565322637558, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 10400 + }, + { + "epoch": 4.34, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46639734245141823, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.720466136932373, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8264, + "eval_samples_per_second": 20.378, + "eval_steps_per_second": 0.676, + "step": 10400 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.36, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4832, + "max_norm": 35.20648193359375, + "max_norm/layer0": 27.249309539794922, + "max_norm/layer1": 28.6260986328125, + "max_norm/layer10": 30.132997512817383, + "max_norm/layer11": 28.141712188720703, + "max_norm/layer12": 31.486787796020508, + "max_norm/layer13": 27.444744110107422, + "max_norm/layer14": 29.066604614257812, + "max_norm/layer15": 34.534122467041016, + "max_norm/layer16": 28.72284698486328, + "max_norm/layer17": 34.44967269897461, + "max_norm/layer18": 30.303834915161133, + "max_norm/layer19": 29.760055541992188, + "max_norm/layer2": 22.440155029296875, + "max_norm/layer20": 30.55260467529297, + "max_norm/layer21": 30.21926498413086, + "max_norm/layer22": 30.969770431518555, + "max_norm/layer23": 29.619102478027344, + "max_norm/layer3": 27.84838104248047, + "max_norm/layer4": 27.581743240356445, + "max_norm/layer5": 35.20648193359375, + "max_norm/layer6": 23.2900447845459, + "max_norm/layer7": 29.881126403808594, + "max_norm/layer8": 29.612140655517578, + "max_norm/layer9": 29.506317138671875, + "mean_norm": 10.886188079913458, + "mean_norm/layer0": 10.531225800514221, + "mean_norm/layer1": 10.35285609960556, + "mean_norm/layer10": 10.706222176551819, + "mean_norm/layer11": 11.034725069999695, + "mean_norm/layer12": 11.609041213989258, + "mean_norm/layer13": 10.704964399337769, + "mean_norm/layer14": 11.106115698814392, + "mean_norm/layer15": 11.453032970428467, + "mean_norm/layer16": 10.78825443983078, + "mean_norm/layer17": 11.290884613990784, + "mean_norm/layer18": 10.816619038581848, + "mean_norm/layer19": 10.870469331741333, + "mean_norm/layer2": 8.923380255699158, + "mean_norm/layer20": 10.980166375637054, + "mean_norm/layer21": 10.9404656291008, + "mean_norm/layer22": 11.961466610431671, + "mean_norm/layer23": 11.909380972385406, + "mean_norm/layer3": 11.38276892900467, + "mean_norm/layer4": 10.14309161901474, + "mean_norm/layer5": 12.632707595825195, + "mean_norm/layer6": 9.641742944717407, + "mean_norm/layer7": 10.184781432151794, + "mean_norm/layer8": 10.689123392105103, + "mean_norm/layer9": 10.61502730846405, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 10450 + }, + { + "epoch": 4.36, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4669814190628004, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.727762460708618, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8074, + "eval_samples_per_second": 20.411, + "eval_steps_per_second": 0.678, + "step": 10450 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.38, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4735, + "max_norm": 35.31102752685547, + "max_norm/layer0": 27.322124481201172, + "max_norm/layer1": 28.704631805419922, + "max_norm/layer10": 30.22309684753418, + "max_norm/layer11": 28.21150016784668, + "max_norm/layer12": 31.58722686767578, + "max_norm/layer13": 27.54606819152832, + "max_norm/layer14": 29.150634765625, + "max_norm/layer15": 34.65001678466797, + "max_norm/layer16": 28.81109619140625, + "max_norm/layer17": 34.57710266113281, + "max_norm/layer18": 30.40672492980957, + "max_norm/layer19": 29.857248306274414, + "max_norm/layer2": 22.493066787719727, + "max_norm/layer20": 30.625856399536133, + "max_norm/layer21": 30.31292152404785, + "max_norm/layer22": 31.06342887878418, + "max_norm/layer23": 29.703598022460938, + "max_norm/layer3": 27.929664611816406, + "max_norm/layer4": 27.665664672851562, + "max_norm/layer5": 35.31102752685547, + "max_norm/layer6": 23.348833084106445, + "max_norm/layer7": 29.977657318115234, + "max_norm/layer8": 29.692916870117188, + "max_norm/layer9": 29.58916473388672, + "mean_norm": 10.896445403496424, + "mean_norm/layer0": 10.544557332992554, + "mean_norm/layer1": 10.36272656917572, + "mean_norm/layer10": 10.715586066246033, + "mean_norm/layer11": 11.045181214809418, + "mean_norm/layer12": 11.622164130210876, + "mean_norm/layer13": 10.71480655670166, + "mean_norm/layer14": 11.11687183380127, + "mean_norm/layer15": 11.465251564979553, + "mean_norm/layer16": 10.797833800315857, + "mean_norm/layer17": 11.301512777805328, + "mean_norm/layer18": 10.825657427310944, + "mean_norm/layer19": 10.87968373298645, + "mean_norm/layer2": 8.926989018917084, + "mean_norm/layer20": 10.989526093006134, + "mean_norm/layer21": 10.949874520301819, + "mean_norm/layer22": 11.974126279354095, + "mean_norm/layer23": 11.922089457511902, + "mean_norm/layer3": 11.395866453647614, + "mean_norm/layer4": 10.151008665561676, + "mean_norm/layer5": 12.650058627128601, + "mean_norm/layer6": 9.647817850112915, + "mean_norm/layer7": 10.19264006614685, + "mean_norm/layer8": 10.698614120483398, + "mean_norm/layer9": 10.624245524406433, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 10500 + }, + { + "epoch": 4.38, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46716394300385733, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.722189426422119, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8232, + "eval_samples_per_second": 20.384, + "eval_steps_per_second": 0.677, + "step": 10500 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.41, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4798, + "max_norm": 35.41484069824219, + "max_norm/layer0": 27.402650833129883, + "max_norm/layer1": 28.785425186157227, + "max_norm/layer10": 30.307842254638672, + "max_norm/layer11": 28.27923011779785, + "max_norm/layer12": 31.686256408691406, + "max_norm/layer13": 27.649747848510742, + "max_norm/layer14": 29.226646423339844, + "max_norm/layer15": 34.76811599731445, + "max_norm/layer16": 28.895538330078125, + "max_norm/layer17": 34.68964385986328, + "max_norm/layer18": 30.481956481933594, + "max_norm/layer19": 29.93875503540039, + "max_norm/layer2": 22.53553009033203, + "max_norm/layer20": 30.70552635192871, + "max_norm/layer21": 30.40555763244629, + "max_norm/layer22": 31.15724754333496, + "max_norm/layer23": 29.78316879272461, + "max_norm/layer3": 28.027681350708008, + "max_norm/layer4": 27.753910064697266, + "max_norm/layer5": 35.41484069824219, + "max_norm/layer6": 23.405353546142578, + "max_norm/layer7": 30.058359146118164, + "max_norm/layer8": 29.767122268676758, + "max_norm/layer9": 29.67656135559082, + "mean_norm": 10.90666925907135, + "mean_norm/layer0": 10.55777508020401, + "mean_norm/layer1": 10.37240594625473, + "mean_norm/layer10": 10.724979639053345, + "mean_norm/layer11": 11.055671870708466, + "mean_norm/layer12": 11.635342717170715, + "mean_norm/layer13": 10.724624454975128, + "mean_norm/layer14": 11.127586245536804, + "mean_norm/layer15": 11.477472305297852, + "mean_norm/layer16": 10.807492911815643, + "mean_norm/layer17": 11.312130510807037, + "mean_norm/layer18": 10.83464765548706, + "mean_norm/layer19": 10.888959348201752, + "mean_norm/layer2": 8.930633246898651, + "mean_norm/layer20": 10.998526573181152, + "mean_norm/layer21": 10.959003448486328, + "mean_norm/layer22": 11.986606121063232, + "mean_norm/layer23": 11.93477600812912, + "mean_norm/layer3": 11.40896886587143, + "mean_norm/layer4": 10.158946633338928, + "mean_norm/layer5": 12.667472839355469, + "mean_norm/layer6": 9.653771996498108, + "mean_norm/layer7": 10.20052433013916, + "mean_norm/layer8": 10.7082160115242, + "mean_norm/layer9": 10.63352745771408, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 10550 + }, + { + "epoch": 4.41, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4674235326089161, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7157599925994873, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8578, + "eval_samples_per_second": 20.324, + "eval_steps_per_second": 0.675, + "step": 10550 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.43, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4831, + "max_norm": 35.51637649536133, + "max_norm/layer0": 27.475908279418945, + "max_norm/layer1": 28.86876106262207, + "max_norm/layer10": 30.390464782714844, + "max_norm/layer11": 28.36003303527832, + "max_norm/layer12": 31.778034210205078, + "max_norm/layer13": 27.747234344482422, + "max_norm/layer14": 29.308727264404297, + "max_norm/layer15": 34.87663650512695, + "max_norm/layer16": 28.978439331054688, + "max_norm/layer17": 34.80805587768555, + "max_norm/layer18": 30.56378173828125, + "max_norm/layer19": 30.048263549804688, + "max_norm/layer2": 22.57395362854004, + "max_norm/layer20": 30.787128448486328, + "max_norm/layer21": 30.525808334350586, + "max_norm/layer22": 31.266019821166992, + "max_norm/layer23": 29.866968154907227, + "max_norm/layer3": 28.12118911743164, + "max_norm/layer4": 27.834333419799805, + "max_norm/layer5": 35.51637649536133, + "max_norm/layer6": 23.4639835357666, + "max_norm/layer7": 30.14113998413086, + "max_norm/layer8": 29.85468864440918, + "max_norm/layer9": 29.7611026763916, + "mean_norm": 10.916920227309069, + "mean_norm/layer0": 10.570904314517975, + "mean_norm/layer1": 10.38205361366272, + "mean_norm/layer10": 10.734330654144287, + "mean_norm/layer11": 11.066179275512695, + "mean_norm/layer12": 11.64851301908493, + "mean_norm/layer13": 10.73451679944992, + "mean_norm/layer14": 11.138398826122284, + "mean_norm/layer15": 11.48961079120636, + "mean_norm/layer16": 10.817120850086212, + "mean_norm/layer17": 11.322860479354858, + "mean_norm/layer18": 10.843526363372803, + "mean_norm/layer19": 10.898203313350677, + "mean_norm/layer2": 8.934328258037567, + "mean_norm/layer20": 11.007682263851166, + "mean_norm/layer21": 10.968221306800842, + "mean_norm/layer22": 11.999272584915161, + "mean_norm/layer23": 11.947436928749084, + "mean_norm/layer3": 11.422153949737549, + "mean_norm/layer4": 10.166811406612396, + "mean_norm/layer5": 12.684915959835052, + "mean_norm/layer6": 9.659890413284302, + "mean_norm/layer7": 10.20842158794403, + "mean_norm/layer8": 10.717842519283295, + "mean_norm/layer9": 10.642889976501465, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 10600 + }, + { + "epoch": 4.43, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4667339977204788, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7145159244537354, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8076, + "eval_samples_per_second": 20.411, + "eval_steps_per_second": 0.678, + "step": 10600 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.45, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4806, + "max_norm": 35.609092712402344, + "max_norm/layer0": 27.55437660217285, + "max_norm/layer1": 28.942262649536133, + "max_norm/layer10": 30.47496795654297, + "max_norm/layer11": 28.428438186645508, + "max_norm/layer12": 31.868505477905273, + "max_norm/layer13": 27.855722427368164, + "max_norm/layer14": 29.389577865600586, + "max_norm/layer15": 34.96714401245117, + "max_norm/layer16": 29.079998016357422, + "max_norm/layer17": 34.91963577270508, + "max_norm/layer18": 30.655733108520508, + "max_norm/layer19": 30.14913558959961, + "max_norm/layer2": 22.608745574951172, + "max_norm/layer20": 30.87098503112793, + "max_norm/layer21": 30.627986907958984, + "max_norm/layer22": 31.354114532470703, + "max_norm/layer23": 29.948514938354492, + "max_norm/layer3": 28.209653854370117, + "max_norm/layer4": 27.917613983154297, + "max_norm/layer5": 35.609092712402344, + "max_norm/layer6": 23.53098487854004, + "max_norm/layer7": 30.23145294189453, + "max_norm/layer8": 29.94053840637207, + "max_norm/layer9": 29.844087600708008, + "mean_norm": 10.927273042500019, + "mean_norm/layer0": 10.584196090698242, + "mean_norm/layer1": 10.391879200935364, + "mean_norm/layer10": 10.74368441104889, + "mean_norm/layer11": 11.076675713062286, + "mean_norm/layer12": 11.661826848983765, + "mean_norm/layer13": 10.744428396224976, + "mean_norm/layer14": 11.149281024932861, + "mean_norm/layer15": 11.501932203769684, + "mean_norm/layer16": 10.826817870140076, + "mean_norm/layer17": 11.333656907081604, + "mean_norm/layer18": 10.852577328681946, + "mean_norm/layer19": 10.907494246959686, + "mean_norm/layer2": 8.938007533550262, + "mean_norm/layer20": 11.017000377178192, + "mean_norm/layer21": 10.977705717086792, + "mean_norm/layer22": 12.012137532234192, + "mean_norm/layer23": 11.960254788398743, + "mean_norm/layer3": 11.435484945774078, + "mean_norm/layer4": 10.174837708473206, + "mean_norm/layer5": 12.702556490898132, + "mean_norm/layer6": 9.666034281253815, + "mean_norm/layer7": 10.216350853443146, + "mean_norm/layer8": 10.727464079856873, + "mean_norm/layer9": 10.652268469333649, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 10650 + }, + { + "epoch": 4.45, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46697736297522136, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7170541286468506, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.7982, + "eval_samples_per_second": 20.427, + "eval_steps_per_second": 0.678, + "step": 10650 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.47, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4783, + "max_norm": 35.705467224121094, + "max_norm/layer0": 27.62490463256836, + "max_norm/layer1": 29.019390106201172, + "max_norm/layer10": 30.577533721923828, + "max_norm/layer11": 28.49982452392578, + "max_norm/layer12": 31.976930618286133, + "max_norm/layer13": 27.960256576538086, + "max_norm/layer14": 29.463733673095703, + "max_norm/layer15": 35.0821647644043, + "max_norm/layer16": 29.184551239013672, + "max_norm/layer17": 35.04167175292969, + "max_norm/layer18": 30.749788284301758, + "max_norm/layer19": 30.25857162475586, + "max_norm/layer2": 22.64493751525879, + "max_norm/layer20": 30.958097457885742, + "max_norm/layer21": 30.731101989746094, + "max_norm/layer22": 31.439579010009766, + "max_norm/layer23": 30.029600143432617, + "max_norm/layer3": 28.30475616455078, + "max_norm/layer4": 28.00230598449707, + "max_norm/layer5": 35.705467224121094, + "max_norm/layer6": 23.597314834594727, + "max_norm/layer7": 30.324081420898438, + "max_norm/layer8": 30.024124145507812, + "max_norm/layer9": 29.914560317993164, + "mean_norm": 10.937589218219122, + "mean_norm/layer0": 10.597443342208862, + "mean_norm/layer1": 10.40154081583023, + "mean_norm/layer10": 10.753035068511963, + "mean_norm/layer11": 11.087162613868713, + "mean_norm/layer12": 11.675267100334167, + "mean_norm/layer13": 10.754276752471924, + "mean_norm/layer14": 11.160140216350555, + "mean_norm/layer15": 11.5142263174057, + "mean_norm/layer16": 10.836543262004852, + "mean_norm/layer17": 11.34443885087967, + "mean_norm/layer18": 10.861545503139496, + "mean_norm/layer19": 10.916850566864014, + "mean_norm/layer2": 8.94169694185257, + "mean_norm/layer20": 11.026383817195892, + "mean_norm/layer21": 10.987124800682068, + "mean_norm/layer22": 12.02495139837265, + "mean_norm/layer23": 11.972956240177155, + "mean_norm/layer3": 11.448661506175995, + "mean_norm/layer4": 10.182782769203186, + "mean_norm/layer5": 12.720122337341309, + "mean_norm/layer6": 9.672084748744965, + "mean_norm/layer7": 10.224287867546082, + "mean_norm/layer8": 10.737088739871979, + "mean_norm/layer9": 10.661529660224915, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 10700 + }, + { + "epoch": 4.47, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4673667473828095, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7178053855895996, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8381, + "eval_samples_per_second": 20.358, + "eval_steps_per_second": 0.676, + "step": 10700 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.49, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4828, + "max_norm": 35.80092239379883, + "max_norm/layer0": 27.704483032226562, + "max_norm/layer1": 29.09988021850586, + "max_norm/layer10": 30.672069549560547, + "max_norm/layer11": 28.57552719116211, + "max_norm/layer12": 32.09391403198242, + "max_norm/layer13": 28.066116333007812, + "max_norm/layer14": 29.550426483154297, + "max_norm/layer15": 35.199127197265625, + "max_norm/layer16": 29.278635025024414, + "max_norm/layer17": 35.16794204711914, + "max_norm/layer18": 30.849281311035156, + "max_norm/layer19": 30.358570098876953, + "max_norm/layer2": 22.691360473632812, + "max_norm/layer20": 31.052244186401367, + "max_norm/layer21": 30.848957061767578, + "max_norm/layer22": 31.532005310058594, + "max_norm/layer23": 30.109872817993164, + "max_norm/layer3": 28.392465591430664, + "max_norm/layer4": 28.095552444458008, + "max_norm/layer5": 35.80092239379883, + "max_norm/layer6": 23.654541015625, + "max_norm/layer7": 30.412067413330078, + "max_norm/layer8": 30.113658905029297, + "max_norm/layer9": 29.99777603149414, + "mean_norm": 10.947911076247692, + "mean_norm/layer0": 10.610689520835876, + "mean_norm/layer1": 10.411279439926147, + "mean_norm/layer10": 10.762393414974213, + "mean_norm/layer11": 11.097654044628143, + "mean_norm/layer12": 11.688684284687042, + "mean_norm/layer13": 10.764097929000854, + "mean_norm/layer14": 11.170956254005432, + "mean_norm/layer15": 11.526572465896606, + "mean_norm/layer16": 10.846267402172089, + "mean_norm/layer17": 11.355244040489197, + "mean_norm/layer18": 10.870476722717285, + "mean_norm/layer19": 10.926155745983124, + "mean_norm/layer2": 8.945383906364441, + "mean_norm/layer20": 11.035573720932007, + "mean_norm/layer21": 10.996546864509583, + "mean_norm/layer22": 12.03775930404663, + "mean_norm/layer23": 11.985740721225739, + "mean_norm/layer3": 11.461913466453552, + "mean_norm/layer4": 10.19075322151184, + "mean_norm/layer5": 12.737750947475433, + "mean_norm/layer6": 9.67819058895111, + "mean_norm/layer7": 10.232214033603668, + "mean_norm/layer8": 10.746669948101044, + "mean_norm/layer9": 10.670897841453552, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 10750 + }, + { + "epoch": 4.49, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4685267884304158, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7106406688690186, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8382, + "eval_samples_per_second": 20.358, + "eval_steps_per_second": 0.676, + "step": 10750 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.51, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4824, + "max_norm": 35.902252197265625, + "max_norm/layer0": 27.77450180053711, + "max_norm/layer1": 29.19710922241211, + "max_norm/layer10": 30.76256561279297, + "max_norm/layer11": 28.64341926574707, + "max_norm/layer12": 32.20515823364258, + "max_norm/layer13": 28.149314880371094, + "max_norm/layer14": 29.625675201416016, + "max_norm/layer15": 35.318763732910156, + "max_norm/layer16": 29.381330490112305, + "max_norm/layer17": 35.283477783203125, + "max_norm/layer18": 30.946577072143555, + "max_norm/layer19": 30.443479537963867, + "max_norm/layer2": 22.751590728759766, + "max_norm/layer20": 31.136180877685547, + "max_norm/layer21": 30.948503494262695, + "max_norm/layer22": 31.631589889526367, + "max_norm/layer23": 30.19828224182129, + "max_norm/layer3": 28.473833084106445, + "max_norm/layer4": 28.17934226989746, + "max_norm/layer5": 35.902252197265625, + "max_norm/layer6": 23.716323852539062, + "max_norm/layer7": 30.506010055541992, + "max_norm/layer8": 30.187671661376953, + "max_norm/layer9": 30.072362899780273, + "mean_norm": 10.958240871628126, + "mean_norm/layer0": 10.623964190483093, + "mean_norm/layer1": 10.421046495437622, + "mean_norm/layer10": 10.771743476390839, + "mean_norm/layer11": 11.10817575454712, + "mean_norm/layer12": 11.702056527137756, + "mean_norm/layer13": 10.774037420749664, + "mean_norm/layer14": 11.181804180145264, + "mean_norm/layer15": 11.53890997171402, + "mean_norm/layer16": 10.85598087310791, + "mean_norm/layer17": 11.366090714931488, + "mean_norm/layer18": 10.879380404949188, + "mean_norm/layer19": 10.935488760471344, + "mean_norm/layer2": 8.94908481836319, + "mean_norm/layer20": 11.04500299692154, + "mean_norm/layer21": 11.00584191083908, + "mean_norm/layer22": 12.050399005413055, + "mean_norm/layer23": 11.998490035533905, + "mean_norm/layer3": 11.475232481956482, + "mean_norm/layer4": 10.198665499687195, + "mean_norm/layer5": 12.75539767742157, + "mean_norm/layer6": 9.684304535388947, + "mean_norm/layer7": 10.240188002586365, + "mean_norm/layer8": 10.756260454654694, + "mean_norm/layer9": 10.680234730243683, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 10800 + }, + { + "epoch": 4.51, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4672450647554382, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7115914821624756, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8271, + "eval_samples_per_second": 20.377, + "eval_steps_per_second": 0.676, + "step": 10800 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.53, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4838, + "max_norm": 36.001617431640625, + "max_norm/layer0": 27.83734893798828, + "max_norm/layer1": 29.293045043945312, + "max_norm/layer10": 30.840595245361328, + "max_norm/layer11": 28.707897186279297, + "max_norm/layer12": 32.31393814086914, + "max_norm/layer13": 28.230504989624023, + "max_norm/layer14": 29.70939826965332, + "max_norm/layer15": 35.45550537109375, + "max_norm/layer16": 29.47163963317871, + "max_norm/layer17": 35.38703536987305, + "max_norm/layer18": 31.027469635009766, + "max_norm/layer19": 30.52695655822754, + "max_norm/layer2": 22.79546356201172, + "max_norm/layer20": 31.22841453552246, + "max_norm/layer21": 31.03502655029297, + "max_norm/layer22": 31.733074188232422, + "max_norm/layer23": 30.28806495666504, + "max_norm/layer3": 28.55718421936035, + "max_norm/layer4": 28.254390716552734, + "max_norm/layer5": 36.001617431640625, + "max_norm/layer6": 23.774742126464844, + "max_norm/layer7": 30.59893798828125, + "max_norm/layer8": 30.25242042541504, + "max_norm/layer9": 30.142948150634766, + "mean_norm": 10.968432190517584, + "mean_norm/layer0": 10.637080550193787, + "mean_norm/layer1": 10.430836737155914, + "mean_norm/layer10": 10.781019687652588, + "mean_norm/layer11": 11.118514716625214, + "mean_norm/layer12": 11.715137422084808, + "mean_norm/layer13": 10.78377228975296, + "mean_norm/layer14": 11.192479372024536, + "mean_norm/layer15": 11.551107704639435, + "mean_norm/layer16": 10.865435600280762, + "mean_norm/layer17": 11.376686751842499, + "mean_norm/layer18": 10.888093769550323, + "mean_norm/layer19": 10.944684505462646, + "mean_norm/layer2": 8.952727675437927, + "mean_norm/layer20": 11.054252862930298, + "mean_norm/layer21": 11.015106618404388, + "mean_norm/layer22": 12.062939047813416, + "mean_norm/layer23": 12.011112213134766, + "mean_norm/layer3": 11.488403975963593, + "mean_norm/layer4": 10.206504702568054, + "mean_norm/layer5": 12.77285772562027, + "mean_norm/layer6": 9.69041132926941, + "mean_norm/layer7": 10.248039662837982, + "mean_norm/layer8": 10.765750110149384, + "mean_norm/layer9": 10.689417541027069, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 10850 + }, + { + "epoch": 4.53, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46874987324726314, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7068047523498535, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8269, + "eval_samples_per_second": 20.377, + "eval_steps_per_second": 0.676, + "step": 10850 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.55, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4766, + "max_norm": 36.10050964355469, + "max_norm/layer0": 27.90643882751465, + "max_norm/layer1": 29.393217086791992, + "max_norm/layer10": 30.925491333007812, + "max_norm/layer11": 28.774173736572266, + "max_norm/layer12": 32.422420501708984, + "max_norm/layer13": 28.32280921936035, + "max_norm/layer14": 29.791353225708008, + "max_norm/layer15": 35.58605194091797, + "max_norm/layer16": 29.558443069458008, + "max_norm/layer17": 35.482425689697266, + "max_norm/layer18": 31.133277893066406, + "max_norm/layer19": 30.631622314453125, + "max_norm/layer2": 22.839784622192383, + "max_norm/layer20": 31.314443588256836, + "max_norm/layer21": 31.123477935791016, + "max_norm/layer22": 31.825902938842773, + "max_norm/layer23": 30.378795623779297, + "max_norm/layer3": 28.63979148864746, + "max_norm/layer4": 28.323528289794922, + "max_norm/layer5": 36.10050964355469, + "max_norm/layer6": 23.828092575073242, + "max_norm/layer7": 30.709747314453125, + "max_norm/layer8": 30.32479476928711, + "max_norm/layer9": 30.2420654296875, + "mean_norm": 10.978607185184956, + "mean_norm/layer0": 10.650204837322235, + "mean_norm/layer1": 10.440573155879974, + "mean_norm/layer10": 10.79030156135559, + "mean_norm/layer11": 11.128903448581696, + "mean_norm/layer12": 11.7282093167305, + "mean_norm/layer13": 10.793516874313354, + "mean_norm/layer14": 11.203150153160095, + "mean_norm/layer15": 11.563211679458618, + "mean_norm/layer16": 10.874927461147308, + "mean_norm/layer17": 11.387232065200806, + "mean_norm/layer18": 10.896808683872223, + "mean_norm/layer19": 10.953786313533783, + "mean_norm/layer2": 8.956369996070862, + "mean_norm/layer20": 11.063383102416992, + "mean_norm/layer21": 11.024434506893158, + "mean_norm/layer22": 12.075482964515686, + "mean_norm/layer23": 12.023701608181, + "mean_norm/layer3": 11.501590967178345, + "mean_norm/layer4": 10.214413344860077, + "mean_norm/layer5": 12.790341198444366, + "mean_norm/layer6": 9.696370244026184, + "mean_norm/layer7": 10.255893349647522, + "mean_norm/layer8": 10.775194346904755, + "mean_norm/layer9": 10.698571264743805, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 10900 + }, + { + "epoch": 4.55, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46807250662156297, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7072505950927734, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.5674, + "eval_samples_per_second": 20.834, + "eval_steps_per_second": 0.692, + "step": 10900 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.57, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4951, + "max_norm": 36.194454193115234, + "max_norm/layer0": 27.984460830688477, + "max_norm/layer1": 29.48598289489746, + "max_norm/layer10": 31.01220703125, + "max_norm/layer11": 28.84075164794922, + "max_norm/layer12": 32.5153694152832, + "max_norm/layer13": 28.403606414794922, + "max_norm/layer14": 29.87116241455078, + "max_norm/layer15": 35.694305419921875, + "max_norm/layer16": 29.650407791137695, + "max_norm/layer17": 35.60575866699219, + "max_norm/layer18": 31.23323631286621, + "max_norm/layer19": 30.72925567626953, + "max_norm/layer2": 22.884504318237305, + "max_norm/layer20": 31.395549774169922, + "max_norm/layer21": 31.2160587310791, + "max_norm/layer22": 31.92021369934082, + "max_norm/layer23": 30.462398529052734, + "max_norm/layer3": 28.742555618286133, + "max_norm/layer4": 28.39634132385254, + "max_norm/layer5": 36.194454193115234, + "max_norm/layer6": 23.88254737854004, + "max_norm/layer7": 30.820144653320312, + "max_norm/layer8": 30.39653205871582, + "max_norm/layer9": 30.330341339111328, + "mean_norm": 10.98867952823639, + "mean_norm/layer0": 10.663160026073456, + "mean_norm/layer1": 10.450208723545074, + "mean_norm/layer10": 10.79953122138977, + "mean_norm/layer11": 11.139248013496399, + "mean_norm/layer12": 11.741204142570496, + "mean_norm/layer13": 10.803188383579254, + "mean_norm/layer14": 11.21361792087555, + "mean_norm/layer15": 11.575240135192871, + "mean_norm/layer16": 10.88437169790268, + "mean_norm/layer17": 11.39776086807251, + "mean_norm/layer18": 10.905632257461548, + "mean_norm/layer19": 10.962841093540192, + "mean_norm/layer2": 8.959905982017517, + "mean_norm/layer20": 11.072368741035461, + "mean_norm/layer21": 11.033558368682861, + "mean_norm/layer22": 12.0879687666893, + "mean_norm/layer23": 12.036184847354889, + "mean_norm/layer3": 11.514626264572144, + "mean_norm/layer4": 10.222147405147552, + "mean_norm/layer5": 12.807550191879272, + "mean_norm/layer6": 9.702159464359283, + "mean_norm/layer7": 10.263650834560394, + "mean_norm/layer8": 10.784475028514862, + "mean_norm/layer9": 10.707708299160004, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 10950 + }, + { + "epoch": 4.57, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4685105640800996, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7058496475219727, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8398, + "eval_samples_per_second": 20.355, + "eval_steps_per_second": 0.676, + "step": 10950 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.59, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4968, + "max_norm": 36.29143142700195, + "max_norm/layer0": 28.067821502685547, + "max_norm/layer1": 29.572872161865234, + "max_norm/layer10": 31.0950927734375, + "max_norm/layer11": 28.908004760742188, + "max_norm/layer12": 32.61347579956055, + "max_norm/layer13": 28.48408317565918, + "max_norm/layer14": 29.953489303588867, + "max_norm/layer15": 35.82485580444336, + "max_norm/layer16": 29.73497200012207, + "max_norm/layer17": 35.71292495727539, + "max_norm/layer18": 31.33292579650879, + "max_norm/layer19": 30.821983337402344, + "max_norm/layer2": 22.939258575439453, + "max_norm/layer20": 31.488800048828125, + "max_norm/layer21": 31.312997817993164, + "max_norm/layer22": 32.024410247802734, + "max_norm/layer23": 30.548397064208984, + "max_norm/layer3": 28.828319549560547, + "max_norm/layer4": 28.46470832824707, + "max_norm/layer5": 36.29143142700195, + "max_norm/layer6": 23.948667526245117, + "max_norm/layer7": 30.933961868286133, + "max_norm/layer8": 30.480300903320312, + "max_norm/layer9": 30.43441390991211, + "mean_norm": 10.99889350682497, + "mean_norm/layer0": 10.676221072673798, + "mean_norm/layer1": 10.459985494613647, + "mean_norm/layer10": 10.808838605880737, + "mean_norm/layer11": 11.149834871292114, + "mean_norm/layer12": 11.754562199115753, + "mean_norm/layer13": 10.812919557094574, + "mean_norm/layer14": 11.22424590587616, + "mean_norm/layer15": 11.587432563304901, + "mean_norm/layer16": 10.893988728523254, + "mean_norm/layer17": 11.408426642417908, + "mean_norm/layer18": 10.914457440376282, + "mean_norm/layer19": 10.971990644931793, + "mean_norm/layer2": 8.963540971279144, + "mean_norm/layer20": 11.081362009048462, + "mean_norm/layer21": 11.042804539203644, + "mean_norm/layer22": 12.100537717342377, + "mean_norm/layer23": 12.048828661441803, + "mean_norm/layer3": 11.527796804904938, + "mean_norm/layer4": 10.23012900352478, + "mean_norm/layer5": 12.824970602989197, + "mean_norm/layer6": 9.708126485347748, + "mean_norm/layer7": 10.271549999713898, + "mean_norm/layer8": 10.793979287147522, + "mean_norm/layer9": 10.716914355754852, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 11000 + }, + { + "epoch": 4.59, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46899323850200575, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.708869218826294, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8407, + "eval_samples_per_second": 20.354, + "eval_steps_per_second": 0.676, + "step": 11000 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.61, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5027, + "max_norm": 36.38948440551758, + "max_norm/layer0": 28.142681121826172, + "max_norm/layer1": 29.65342903137207, + "max_norm/layer10": 31.172306060791016, + "max_norm/layer11": 28.979270935058594, + "max_norm/layer12": 32.718421936035156, + "max_norm/layer13": 28.559803009033203, + "max_norm/layer14": 30.038625717163086, + "max_norm/layer15": 35.952938079833984, + "max_norm/layer16": 29.816696166992188, + "max_norm/layer17": 35.83388900756836, + "max_norm/layer18": 31.439905166625977, + "max_norm/layer19": 30.919139862060547, + "max_norm/layer2": 22.99624252319336, + "max_norm/layer20": 31.571073532104492, + "max_norm/layer21": 31.403352737426758, + "max_norm/layer22": 32.12685012817383, + "max_norm/layer23": 30.628877639770508, + "max_norm/layer3": 28.90157699584961, + "max_norm/layer4": 28.525489807128906, + "max_norm/layer5": 36.38948440551758, + "max_norm/layer6": 24.00628662109375, + "max_norm/layer7": 31.039264678955078, + "max_norm/layer8": 30.567359924316406, + "max_norm/layer9": 30.537586212158203, + "mean_norm": 11.008995535473028, + "mean_norm/layer0": 10.68915969133377, + "mean_norm/layer1": 10.46977412700653, + "mean_norm/layer10": 10.818095445632935, + "mean_norm/layer11": 11.16015911102295, + "mean_norm/layer12": 11.767687618732452, + "mean_norm/layer13": 10.822493731975555, + "mean_norm/layer14": 11.234766364097595, + "mean_norm/layer15": 11.599426746368408, + "mean_norm/layer16": 10.903450429439545, + "mean_norm/layer17": 11.418922483921051, + "mean_norm/layer18": 10.923265159130096, + "mean_norm/layer19": 10.981090009212494, + "mean_norm/layer2": 8.967131793498993, + "mean_norm/layer20": 11.090291917324066, + "mean_norm/layer21": 11.05186927318573, + "mean_norm/layer22": 12.113010346889496, + "mean_norm/layer23": 12.061234652996063, + "mean_norm/layer3": 11.540878176689148, + "mean_norm/layer4": 10.238067269325256, + "mean_norm/layer5": 12.84223461151123, + "mean_norm/layer6": 9.714037954807281, + "mean_norm/layer7": 10.279354095458984, + "mean_norm/layer8": 10.803401052951813, + "mean_norm/layer9": 10.726090788841248, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 11050 + }, + { + "epoch": 4.61, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4690013506771638, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7019741535186768, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6244, + "eval_samples_per_second": 20.732, + "eval_steps_per_second": 0.688, + "step": 11050 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.63, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4867, + "max_norm": 36.485416412353516, + "max_norm/layer0": 28.211668014526367, + "max_norm/layer1": 29.72883415222168, + "max_norm/layer10": 31.23760986328125, + "max_norm/layer11": 29.053224563598633, + "max_norm/layer12": 32.811614990234375, + "max_norm/layer13": 28.64307975769043, + "max_norm/layer14": 30.11770248413086, + "max_norm/layer15": 36.074459075927734, + "max_norm/layer16": 29.89780044555664, + "max_norm/layer17": 35.94729232788086, + "max_norm/layer18": 31.554128646850586, + "max_norm/layer19": 31.01970100402832, + "max_norm/layer2": 23.0423641204834, + "max_norm/layer20": 31.650583267211914, + "max_norm/layer21": 31.490772247314453, + "max_norm/layer22": 32.22224426269531, + "max_norm/layer23": 30.71469497680664, + "max_norm/layer3": 28.968250274658203, + "max_norm/layer4": 28.582042694091797, + "max_norm/layer5": 36.485416412353516, + "max_norm/layer6": 24.07797622680664, + "max_norm/layer7": 31.14894676208496, + "max_norm/layer8": 30.651403427124023, + "max_norm/layer9": 30.636816024780273, + "mean_norm": 11.019032259782156, + "mean_norm/layer0": 10.701907813549042, + "mean_norm/layer1": 10.479356586933136, + "mean_norm/layer10": 10.827310979366302, + "mean_norm/layer11": 11.170374512672424, + "mean_norm/layer12": 11.780598878860474, + "mean_norm/layer13": 10.83207768201828, + "mean_norm/layer14": 11.245192289352417, + "mean_norm/layer15": 11.61131465435028, + "mean_norm/layer16": 10.912882566452026, + "mean_norm/layer17": 11.429385244846344, + "mean_norm/layer18": 10.932092487812042, + "mean_norm/layer19": 10.990167617797852, + "mean_norm/layer2": 8.970707833766937, + "mean_norm/layer20": 11.099395036697388, + "mean_norm/layer21": 11.060913383960724, + "mean_norm/layer22": 12.12530916929245, + "mean_norm/layer23": 12.073706030845642, + "mean_norm/layer3": 11.553913176059723, + "mean_norm/layer4": 10.24598515033722, + "mean_norm/layer5": 12.85935389995575, + "mean_norm/layer6": 9.71992015838623, + "mean_norm/layer7": 10.287022113800049, + "mean_norm/layer8": 10.812736868858337, + "mean_norm/layer9": 10.73515009880066, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 11100 + }, + { + "epoch": 4.63, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4689810702392686, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.702160596847534, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8364, + "eval_samples_per_second": 20.361, + "eval_steps_per_second": 0.676, + "step": 11100 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.66, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4907, + "max_norm": 36.590641021728516, + "max_norm/layer0": 28.281400680541992, + "max_norm/layer1": 29.814014434814453, + "max_norm/layer10": 31.30912971496582, + "max_norm/layer11": 29.127084732055664, + "max_norm/layer12": 32.911705017089844, + "max_norm/layer13": 28.726318359375, + "max_norm/layer14": 30.1971435546875, + "max_norm/layer15": 36.19831085205078, + "max_norm/layer16": 29.989545822143555, + "max_norm/layer17": 36.075653076171875, + "max_norm/layer18": 31.639633178710938, + "max_norm/layer19": 31.121540069580078, + "max_norm/layer2": 23.09928321838379, + "max_norm/layer20": 31.74033546447754, + "max_norm/layer21": 31.588829040527344, + "max_norm/layer22": 32.31295394897461, + "max_norm/layer23": 30.793426513671875, + "max_norm/layer3": 29.041465759277344, + "max_norm/layer4": 28.63759994506836, + "max_norm/layer5": 36.590641021728516, + "max_norm/layer6": 24.13155746459961, + "max_norm/layer7": 31.24675178527832, + "max_norm/layer8": 30.736846923828125, + "max_norm/layer9": 30.751882553100586, + "mean_norm": 11.029068134725094, + "mean_norm/layer0": 10.71463930606842, + "mean_norm/layer1": 10.488974511623383, + "mean_norm/layer10": 10.836424171924591, + "mean_norm/layer11": 11.180540084838867, + "mean_norm/layer12": 11.793593287467957, + "mean_norm/layer13": 10.841667890548706, + "mean_norm/layer14": 11.255710542201996, + "mean_norm/layer15": 11.62320464849472, + "mean_norm/layer16": 10.922313868999481, + "mean_norm/layer17": 11.43975281715393, + "mean_norm/layer18": 10.94078254699707, + "mean_norm/layer19": 10.999189674854279, + "mean_norm/layer2": 8.97431856393814, + "mean_norm/layer20": 11.108398020267487, + "mean_norm/layer21": 11.070019721984863, + "mean_norm/layer22": 12.137679636478424, + "mean_norm/layer23": 12.086146414279938, + "mean_norm/layer3": 11.566857933998108, + "mean_norm/layer4": 10.25378680229187, + "mean_norm/layer5": 12.876568496227264, + "mean_norm/layer6": 9.725827276706696, + "mean_norm/layer7": 10.294805943965912, + "mean_norm/layer8": 10.822121918201447, + "mean_norm/layer9": 10.744311153888702, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 11150 + }, + { + "epoch": 4.66, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46954892250033464, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.702021360397339, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8177, + "eval_samples_per_second": 20.393, + "eval_steps_per_second": 0.677, + "step": 11150 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.68, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4889, + "max_norm": 36.693843841552734, + "max_norm/layer0": 28.353055953979492, + "max_norm/layer1": 29.90206527709961, + "max_norm/layer10": 31.385793685913086, + "max_norm/layer11": 29.21958351135254, + "max_norm/layer12": 33.02078628540039, + "max_norm/layer13": 28.812292098999023, + "max_norm/layer14": 30.27202606201172, + "max_norm/layer15": 36.33440399169922, + "max_norm/layer16": 30.099519729614258, + "max_norm/layer17": 36.19306564331055, + "max_norm/layer18": 31.73409652709961, + "max_norm/layer19": 31.216930389404297, + "max_norm/layer2": 23.159343719482422, + "max_norm/layer20": 31.83723258972168, + "max_norm/layer21": 31.70283317565918, + "max_norm/layer22": 32.40229034423828, + "max_norm/layer23": 30.87533187866211, + "max_norm/layer3": 29.103801727294922, + "max_norm/layer4": 28.69968605041504, + "max_norm/layer5": 36.693843841552734, + "max_norm/layer6": 24.19968032836914, + "max_norm/layer7": 31.33868980407715, + "max_norm/layer8": 30.82036018371582, + "max_norm/layer9": 30.858015060424805, + "mean_norm": 11.039107086757818, + "mean_norm/layer0": 10.727317333221436, + "mean_norm/layer1": 10.498592138290405, + "mean_norm/layer10": 10.845584452152252, + "mean_norm/layer11": 11.190867006778717, + "mean_norm/layer12": 11.806601226329803, + "mean_norm/layer13": 10.851321637630463, + "mean_norm/layer14": 11.26624971628189, + "mean_norm/layer15": 11.63513070344925, + "mean_norm/layer16": 10.931711971759796, + "mean_norm/layer17": 11.450206220149994, + "mean_norm/layer18": 10.949472665786743, + "mean_norm/layer19": 11.008228719234467, + "mean_norm/layer2": 8.977922022342682, + "mean_norm/layer20": 11.11731094121933, + "mean_norm/layer21": 11.079086363315582, + "mean_norm/layer22": 12.150035500526428, + "mean_norm/layer23": 12.098583281040192, + "mean_norm/layer3": 11.579851865768433, + "mean_norm/layer4": 10.261609435081482, + "mean_norm/layer5": 12.89377510547638, + "mean_norm/layer6": 9.731728971004486, + "mean_norm/layer7": 10.302535831928253, + "mean_norm/layer8": 10.831456780433655, + "mean_norm/layer9": 10.753390192985535, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 11200 + }, + { + "epoch": 4.68, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4700640456228731, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7000200748443604, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8823, + "eval_samples_per_second": 20.282, + "eval_steps_per_second": 0.673, + "step": 11200 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.7, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4911, + "max_norm": 36.80110168457031, + "max_norm/layer0": 28.42072105407715, + "max_norm/layer1": 29.987051010131836, + "max_norm/layer10": 31.46202850341797, + "max_norm/layer11": 29.302335739135742, + "max_norm/layer12": 33.13109588623047, + "max_norm/layer13": 28.901945114135742, + "max_norm/layer14": 30.360057830810547, + "max_norm/layer15": 36.44215393066406, + "max_norm/layer16": 30.18164825439453, + "max_norm/layer17": 36.3160285949707, + "max_norm/layer18": 31.817520141601562, + "max_norm/layer19": 31.32172966003418, + "max_norm/layer2": 23.22319984436035, + "max_norm/layer20": 31.919742584228516, + "max_norm/layer21": 31.79605484008789, + "max_norm/layer22": 32.49842834472656, + "max_norm/layer23": 30.966951370239258, + "max_norm/layer3": 29.168514251708984, + "max_norm/layer4": 28.76665496826172, + "max_norm/layer5": 36.80110168457031, + "max_norm/layer6": 24.263078689575195, + "max_norm/layer7": 31.429777145385742, + "max_norm/layer8": 30.894712448120117, + "max_norm/layer9": 30.976171493530273, + "mean_norm": 11.049177487691244, + "mean_norm/layer0": 10.739985823631287, + "mean_norm/layer1": 10.5082568526268, + "mean_norm/layer10": 10.85473507642746, + "mean_norm/layer11": 11.201318681240082, + "mean_norm/layer12": 11.819770455360413, + "mean_norm/layer13": 10.861029326915741, + "mean_norm/layer14": 11.276723444461823, + "mean_norm/layer15": 11.647155404090881, + "mean_norm/layer16": 10.941185355186462, + "mean_norm/layer17": 11.46070909500122, + "mean_norm/layer18": 10.958095967769623, + "mean_norm/layer19": 11.017280280590057, + "mean_norm/layer2": 8.981531858444214, + "mean_norm/layer20": 11.126353204250336, + "mean_norm/layer21": 11.088174939155579, + "mean_norm/layer22": 12.162321031093597, + "mean_norm/layer23": 12.111066281795502, + "mean_norm/layer3": 11.59280115365982, + "mean_norm/layer4": 10.269557535648346, + "mean_norm/layer5": 12.910930395126343, + "mean_norm/layer6": 9.737641453742981, + "mean_norm/layer7": 10.310417890548706, + "mean_norm/layer8": 10.840794563293457, + "mean_norm/layer9": 10.762423634529114, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 11250 + }, + { + "epoch": 4.7, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4693420620338034, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.6996147632598877, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.838, + "eval_samples_per_second": 20.358, + "eval_steps_per_second": 0.676, + "step": 11250 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.72, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4906, + "max_norm": 36.90290832519531, + "max_norm/layer0": 28.498428344726562, + "max_norm/layer1": 30.071109771728516, + "max_norm/layer10": 31.552982330322266, + "max_norm/layer11": 29.381942749023438, + "max_norm/layer12": 33.24612045288086, + "max_norm/layer13": 28.998634338378906, + "max_norm/layer14": 30.43010902404785, + "max_norm/layer15": 36.54443359375, + "max_norm/layer16": 30.27066993713379, + "max_norm/layer17": 36.46219253540039, + "max_norm/layer18": 31.914384841918945, + "max_norm/layer19": 31.426963806152344, + "max_norm/layer2": 23.282331466674805, + "max_norm/layer20": 32.007347106933594, + "max_norm/layer21": 31.882448196411133, + "max_norm/layer22": 32.59296417236328, + "max_norm/layer23": 31.06037712097168, + "max_norm/layer3": 29.24478530883789, + "max_norm/layer4": 28.834274291992188, + "max_norm/layer5": 36.90290832519531, + "max_norm/layer6": 24.324382781982422, + "max_norm/layer7": 31.510684967041016, + "max_norm/layer8": 30.968204498291016, + "max_norm/layer9": 31.075193405151367, + "mean_norm": 11.05928177634875, + "mean_norm/layer0": 10.7528635263443, + "mean_norm/layer1": 10.51784473657608, + "mean_norm/layer10": 10.863938212394714, + "mean_norm/layer11": 11.211776793003082, + "mean_norm/layer12": 11.832974255084991, + "mean_norm/layer13": 10.870778441429138, + "mean_norm/layer14": 11.287272453308105, + "mean_norm/layer15": 11.65920740365982, + "mean_norm/layer16": 10.950676381587982, + "mean_norm/layer17": 11.471208274364471, + "mean_norm/layer18": 10.96678340435028, + "mean_norm/layer19": 11.026268124580383, + "mean_norm/layer2": 8.985169887542725, + "mean_norm/layer20": 11.135346353054047, + "mean_norm/layer21": 11.097164869308472, + "mean_norm/layer22": 12.174674391746521, + "mean_norm/layer23": 12.123576819896698, + "mean_norm/layer3": 11.605943202972412, + "mean_norm/layer4": 10.27738219499588, + "mean_norm/layer5": 12.928228676319122, + "mean_norm/layer6": 9.743575870990753, + "mean_norm/layer7": 10.318305909633636, + "mean_norm/layer8": 10.850202322006226, + "mean_norm/layer9": 10.771600127220154, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 11300 + }, + { + "epoch": 4.72, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46931366942075015, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.702225923538208, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8556, + "eval_samples_per_second": 20.328, + "eval_steps_per_second": 0.675, + "step": 11300 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.74, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5083, + "max_norm": 36.998252868652344, + "max_norm/layer0": 28.57436180114746, + "max_norm/layer1": 30.16019058227539, + "max_norm/layer10": 31.637813568115234, + "max_norm/layer11": 29.452293395996094, + "max_norm/layer12": 33.34236145019531, + "max_norm/layer13": 29.110563278198242, + "max_norm/layer14": 30.50075340270996, + "max_norm/layer15": 36.65324783325195, + "max_norm/layer16": 30.35845184326172, + "max_norm/layer17": 36.59389877319336, + "max_norm/layer18": 32.02538299560547, + "max_norm/layer19": 31.53948211669922, + "max_norm/layer2": 23.335365295410156, + "max_norm/layer20": 32.10725402832031, + "max_norm/layer21": 31.964698791503906, + "max_norm/layer22": 32.67811584472656, + "max_norm/layer23": 31.14203643798828, + "max_norm/layer3": 29.3145809173584, + "max_norm/layer4": 28.908462524414062, + "max_norm/layer5": 36.998252868652344, + "max_norm/layer6": 24.38912010192871, + "max_norm/layer7": 31.59634017944336, + "max_norm/layer8": 31.052322387695312, + "max_norm/layer9": 31.170902252197266, + "mean_norm": 11.069261901080608, + "mean_norm/layer0": 10.765595376491547, + "mean_norm/layer1": 10.527443945407867, + "mean_norm/layer10": 10.873034358024597, + "mean_norm/layer11": 11.221920251846313, + "mean_norm/layer12": 11.84593778848648, + "mean_norm/layer13": 10.880328059196472, + "mean_norm/layer14": 11.29772400856018, + "mean_norm/layer15": 11.67112535238266, + "mean_norm/layer16": 10.96004843711853, + "mean_norm/layer17": 11.481589019298553, + "mean_norm/layer18": 10.9753977060318, + "mean_norm/layer19": 11.03517997264862, + "mean_norm/layer2": 8.98877876996994, + "mean_norm/layer20": 11.144243478775024, + "mean_norm/layer21": 11.106104969978333, + "mean_norm/layer22": 12.18696117401123, + "mean_norm/layer23": 12.135864198207855, + "mean_norm/layer3": 11.618866682052612, + "mean_norm/layer4": 10.285234451293945, + "mean_norm/layer5": 12.945219874382019, + "mean_norm/layer6": 9.74939090013504, + "mean_norm/layer7": 10.32614415884018, + "mean_norm/layer8": 10.859492838382721, + "mean_norm/layer9": 10.780659854412079, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 11350 + }, + { + "epoch": 4.74, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.470055933447715, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.698378086090088, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8271, + "eval_samples_per_second": 20.377, + "eval_steps_per_second": 0.676, + "step": 11350 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.76, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4982, + "max_norm": 37.1029052734375, + "max_norm/layer0": 28.656028747558594, + "max_norm/layer1": 30.25836181640625, + "max_norm/layer10": 31.71713638305664, + "max_norm/layer11": 29.52212905883789, + "max_norm/layer12": 33.44416427612305, + "max_norm/layer13": 29.218441009521484, + "max_norm/layer14": 30.57339859008789, + "max_norm/layer15": 36.7493896484375, + "max_norm/layer16": 30.460256576538086, + "max_norm/layer17": 36.72866439819336, + "max_norm/layer18": 32.121299743652344, + "max_norm/layer19": 31.664583206176758, + "max_norm/layer2": 23.3944091796875, + "max_norm/layer20": 32.202659606933594, + "max_norm/layer21": 32.049556732177734, + "max_norm/layer22": 32.76599884033203, + "max_norm/layer23": 31.217979431152344, + "max_norm/layer3": 29.3818416595459, + "max_norm/layer4": 28.99262046813965, + "max_norm/layer5": 37.1029052734375, + "max_norm/layer6": 24.457334518432617, + "max_norm/layer7": 31.686601638793945, + "max_norm/layer8": 31.13671112060547, + "max_norm/layer9": 31.269529342651367, + "mean_norm": 11.079338165620962, + "mean_norm/layer0": 10.778338432312012, + "mean_norm/layer1": 10.537169218063354, + "mean_norm/layer10": 10.882223546504974, + "mean_norm/layer11": 11.232254266738892, + "mean_norm/layer12": 11.85909241437912, + "mean_norm/layer13": 10.889939963817596, + "mean_norm/layer14": 11.308136761188507, + "mean_norm/layer15": 11.683177769184113, + "mean_norm/layer16": 10.969454109668732, + "mean_norm/layer17": 11.491996049880981, + "mean_norm/layer18": 10.984146773815155, + "mean_norm/layer19": 11.04429715871811, + "mean_norm/layer2": 8.992380321025848, + "mean_norm/layer20": 11.153231382369995, + "mean_norm/layer21": 11.115254282951355, + "mean_norm/layer22": 12.199417114257812, + "mean_norm/layer23": 12.148304343223572, + "mean_norm/layer3": 11.631822049617767, + "mean_norm/layer4": 10.293142974376678, + "mean_norm/layer5": 12.962431788444519, + "mean_norm/layer6": 9.755285799503326, + "mean_norm/layer7": 10.333933413028717, + "mean_norm/layer8": 10.86891096830368, + "mean_norm/layer9": 10.78977507352829, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 11400 + }, + { + "epoch": 4.76, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4695732590258089, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.696803092956543, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8371, + "eval_samples_per_second": 20.36, + "eval_steps_per_second": 0.676, + "step": 11400 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.78, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4981, + "max_norm": 37.19981384277344, + "max_norm/layer0": 28.733051300048828, + "max_norm/layer1": 30.349668502807617, + "max_norm/layer10": 31.805160522460938, + "max_norm/layer11": 29.594594955444336, + "max_norm/layer12": 33.550926208496094, + "max_norm/layer13": 29.31583595275879, + "max_norm/layer14": 30.652856826782227, + "max_norm/layer15": 36.8530387878418, + "max_norm/layer16": 30.553306579589844, + "max_norm/layer17": 36.866615295410156, + "max_norm/layer18": 32.23554992675781, + "max_norm/layer19": 31.7749080657959, + "max_norm/layer2": 23.452619552612305, + "max_norm/layer20": 32.29941177368164, + "max_norm/layer21": 32.140113830566406, + "max_norm/layer22": 32.85822677612305, + "max_norm/layer23": 31.301639556884766, + "max_norm/layer3": 29.454954147338867, + "max_norm/layer4": 29.073352813720703, + "max_norm/layer5": 37.19981384277344, + "max_norm/layer6": 24.528331756591797, + "max_norm/layer7": 31.778316497802734, + "max_norm/layer8": 31.21552085876465, + "max_norm/layer9": 31.349042892456055, + "mean_norm": 11.089381170769533, + "mean_norm/layer0": 10.790962219238281, + "mean_norm/layer1": 10.546747326850891, + "mean_norm/layer10": 10.89135366678238, + "mean_norm/layer11": 11.24245822429657, + "mean_norm/layer12": 11.872169077396393, + "mean_norm/layer13": 10.899617612361908, + "mean_norm/layer14": 11.318670332431793, + "mean_norm/layer15": 11.695177555084229, + "mean_norm/layer16": 10.97891902923584, + "mean_norm/layer17": 11.502409100532532, + "mean_norm/layer18": 10.992907166481018, + "mean_norm/layer19": 11.053321421146393, + "mean_norm/layer2": 8.995991051197052, + "mean_norm/layer20": 11.16218513250351, + "mean_norm/layer21": 11.124274849891663, + "mean_norm/layer22": 12.21173882484436, + "mean_norm/layer23": 12.160701274871826, + "mean_norm/layer3": 11.644759356975555, + "mean_norm/layer4": 10.301061511039734, + "mean_norm/layer5": 12.979609191417694, + "mean_norm/layer6": 9.761213302612305, + "mean_norm/layer7": 10.34174370765686, + "mean_norm/layer8": 10.878252863883972, + "mean_norm/layer9": 10.798904299736023, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 11450 + }, + { + "epoch": 4.78, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4699666995209761, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.6955602169036865, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6354, + "eval_samples_per_second": 20.713, + "eval_steps_per_second": 0.688, + "step": 11450 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.8, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5003, + "max_norm": 37.291603088378906, + "max_norm/layer0": 28.814542770385742, + "max_norm/layer1": 30.436798095703125, + "max_norm/layer10": 31.88617706298828, + "max_norm/layer11": 29.67328453063965, + "max_norm/layer12": 33.657833099365234, + "max_norm/layer13": 29.41160011291504, + "max_norm/layer14": 30.73747444152832, + "max_norm/layer15": 36.9760856628418, + "max_norm/layer16": 30.654407501220703, + "max_norm/layer17": 36.99338912963867, + "max_norm/layer18": 32.32841110229492, + "max_norm/layer19": 31.86827850341797, + "max_norm/layer2": 23.515026092529297, + "max_norm/layer20": 32.38021469116211, + "max_norm/layer21": 32.233619689941406, + "max_norm/layer22": 32.957420349121094, + "max_norm/layer23": 31.38813018798828, + "max_norm/layer3": 29.526674270629883, + "max_norm/layer4": 29.14989471435547, + "max_norm/layer5": 37.291603088378906, + "max_norm/layer6": 24.593555450439453, + "max_norm/layer7": 31.88994026184082, + "max_norm/layer8": 31.295120239257812, + "max_norm/layer9": 31.42879295349121, + "mean_norm": 11.099412376681963, + "mean_norm/layer0": 10.803522825241089, + "mean_norm/layer1": 10.556218922138214, + "mean_norm/layer10": 10.900573432445526, + "mean_norm/layer11": 11.252809882164001, + "mean_norm/layer12": 11.885180056095123, + "mean_norm/layer13": 10.90925019979477, + "mean_norm/layer14": 11.329178392887115, + "mean_norm/layer15": 11.707133948802948, + "mean_norm/layer16": 10.988328516483307, + "mean_norm/layer17": 11.51287591457367, + "mean_norm/layer18": 11.001640021800995, + "mean_norm/layer19": 11.062367856502533, + "mean_norm/layer2": 8.999559462070465, + "mean_norm/layer20": 11.171233415603638, + "mean_norm/layer21": 11.133346021175385, + "mean_norm/layer22": 12.224068105220795, + "mean_norm/layer23": 12.173038482666016, + "mean_norm/layer3": 11.657609105110168, + "mean_norm/layer4": 10.308907628059387, + "mean_norm/layer5": 12.996685802936554, + "mean_norm/layer6": 9.767203569412231, + "mean_norm/layer7": 10.3494833111763, + "mean_norm/layer8": 10.887590944766998, + "mean_norm/layer9": 10.808091223239899, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 11500 + }, + { + "epoch": 4.8, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4696584368649688, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.6966724395751953, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8337, + "eval_samples_per_second": 20.366, + "eval_steps_per_second": 0.676, + "step": 11500 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.82, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5146, + "max_norm": 37.38665008544922, + "max_norm/layer0": 28.893375396728516, + "max_norm/layer1": 30.520029067993164, + "max_norm/layer10": 31.96396255493164, + "max_norm/layer11": 29.7481632232666, + "max_norm/layer12": 33.75273513793945, + "max_norm/layer13": 29.522672653198242, + "max_norm/layer14": 30.82471466064453, + "max_norm/layer15": 37.11414337158203, + "max_norm/layer16": 30.747474670410156, + "max_norm/layer17": 37.13072204589844, + "max_norm/layer18": 32.423282623291016, + "max_norm/layer19": 31.967445373535156, + "max_norm/layer2": 23.584957122802734, + "max_norm/layer20": 32.46532440185547, + "max_norm/layer21": 32.333984375, + "max_norm/layer22": 33.03456497192383, + "max_norm/layer23": 31.466445922851562, + "max_norm/layer3": 29.594579696655273, + "max_norm/layer4": 29.243301391601562, + "max_norm/layer5": 37.38665008544922, + "max_norm/layer6": 24.651927947998047, + "max_norm/layer7": 31.993391036987305, + "max_norm/layer8": 31.371482849121094, + "max_norm/layer9": 31.511945724487305, + "mean_norm": 11.10927926003933, + "mean_norm/layer0": 10.81601083278656, + "mean_norm/layer1": 10.565600395202637, + "mean_norm/layer10": 10.909658670425415, + "mean_norm/layer11": 11.262958586215973, + "mean_norm/layer12": 11.898052752017975, + "mean_norm/layer13": 10.91872924566269, + "mean_norm/layer14": 11.339493930339813, + "mean_norm/layer15": 11.718998372554779, + "mean_norm/layer16": 10.997642517089844, + "mean_norm/layer17": 11.523203492164612, + "mean_norm/layer18": 11.01017940044403, + "mean_norm/layer19": 11.071209847927094, + "mean_norm/layer2": 9.003080189228058, + "mean_norm/layer20": 11.179914832115173, + "mean_norm/layer21": 11.142175793647766, + "mean_norm/layer22": 12.23628032207489, + "mean_norm/layer23": 12.185180723667145, + "mean_norm/layer3": 11.6702880859375, + "mean_norm/layer4": 10.316582083702087, + "mean_norm/layer5": 13.013548851013184, + "mean_norm/layer6": 9.772991418838501, + "mean_norm/layer7": 10.357124924659729, + "mean_norm/layer8": 10.896804749965668, + "mean_norm/layer9": 10.816992223262787, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 11550 + }, + { + "epoch": 4.82, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.47042098132982885, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.691270589828491, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6472, + "eval_samples_per_second": 20.692, + "eval_steps_per_second": 0.687, + "step": 11550 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.84, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5026, + "max_norm": 37.47762680053711, + "max_norm/layer0": 28.971616744995117, + "max_norm/layer1": 30.603607177734375, + "max_norm/layer10": 32.050777435302734, + "max_norm/layer11": 29.829021453857422, + "max_norm/layer12": 33.8441162109375, + "max_norm/layer13": 29.632450103759766, + "max_norm/layer14": 30.915212631225586, + "max_norm/layer15": 37.232913970947266, + "max_norm/layer16": 30.840450286865234, + "max_norm/layer17": 37.286354064941406, + "max_norm/layer18": 32.52165985107422, + "max_norm/layer19": 32.06243896484375, + "max_norm/layer2": 23.63981819152832, + "max_norm/layer20": 32.5574836730957, + "max_norm/layer21": 32.43302536010742, + "max_norm/layer22": 33.13492202758789, + "max_norm/layer23": 31.543638229370117, + "max_norm/layer3": 29.668012619018555, + "max_norm/layer4": 29.327556610107422, + "max_norm/layer5": 37.47762680053711, + "max_norm/layer6": 24.719707489013672, + "max_norm/layer7": 32.09111022949219, + "max_norm/layer8": 31.45081901550293, + "max_norm/layer9": 31.5856876373291, + "mean_norm": 11.11912084867557, + "mean_norm/layer0": 10.828483998775482, + "mean_norm/layer1": 10.574886500835419, + "mean_norm/layer10": 10.918683588504791, + "mean_norm/layer11": 11.27305418252945, + "mean_norm/layer12": 11.910798013210297, + "mean_norm/layer13": 10.928040564060211, + "mean_norm/layer14": 11.349718570709229, + "mean_norm/layer15": 11.730824649333954, + "mean_norm/layer16": 11.00691682100296, + "mean_norm/layer17": 11.53353351354599, + "mean_norm/layer18": 11.018724083900452, + "mean_norm/layer19": 11.080044209957123, + "mean_norm/layer2": 9.00660353899002, + "mean_norm/layer20": 11.188700079917908, + "mean_norm/layer21": 11.151018679141998, + "mean_norm/layer22": 12.248418152332306, + "mean_norm/layer23": 12.19741666316986, + "mean_norm/layer3": 11.682981371879578, + "mean_norm/layer4": 10.324283599853516, + "mean_norm/layer5": 13.030375838279724, + "mean_norm/layer6": 9.778766095638275, + "mean_norm/layer7": 10.364711105823517, + "mean_norm/layer8": 10.906016230583191, + "mean_norm/layer9": 10.825900316238403, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 11600 + }, + { + "epoch": 4.84, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.47171892935512266, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.687462568283081, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 10.8212, + "eval_samples_per_second": 22.271, + "eval_steps_per_second": 0.739, + "step": 11600 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.86, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5085, + "max_norm": 37.56265640258789, + "max_norm/layer0": 29.0488224029541, + "max_norm/layer1": 30.683454513549805, + "max_norm/layer10": 32.14421844482422, + "max_norm/layer11": 29.910310745239258, + "max_norm/layer12": 33.934776306152344, + "max_norm/layer13": 29.738357543945312, + "max_norm/layer14": 30.991455078125, + "max_norm/layer15": 37.36259841918945, + "max_norm/layer16": 30.928890228271484, + "max_norm/layer17": 37.42397689819336, + "max_norm/layer18": 32.626399993896484, + "max_norm/layer19": 32.142608642578125, + "max_norm/layer2": 23.6883544921875, + "max_norm/layer20": 32.648311614990234, + "max_norm/layer21": 32.51786804199219, + "max_norm/layer22": 33.245933532714844, + "max_norm/layer23": 31.61872673034668, + "max_norm/layer3": 29.742652893066406, + "max_norm/layer4": 29.407451629638672, + "max_norm/layer5": 37.56265640258789, + "max_norm/layer6": 24.781131744384766, + "max_norm/layer7": 32.19428253173828, + "max_norm/layer8": 31.526046752929688, + "max_norm/layer9": 31.649673461914062, + "mean_norm": 11.12895734856526, + "mean_norm/layer0": 10.840919971466064, + "mean_norm/layer1": 10.584234595298767, + "mean_norm/layer10": 10.927650392055511, + "mean_norm/layer11": 11.283041536808014, + "mean_norm/layer12": 11.923579931259155, + "mean_norm/layer13": 10.937540829181671, + "mean_norm/layer14": 11.360036492347717, + "mean_norm/layer15": 11.742550194263458, + "mean_norm/layer16": 11.016173362731934, + "mean_norm/layer17": 11.543751299381256, + "mean_norm/layer18": 11.027178168296814, + "mean_norm/layer19": 11.088969767093658, + "mean_norm/layer2": 9.010113298892975, + "mean_norm/layer20": 11.197400689125061, + "mean_norm/layer21": 11.159915804862976, + "mean_norm/layer22": 12.260593712329865, + "mean_norm/layer23": 12.209560513496399, + "mean_norm/layer3": 11.695660948753357, + "mean_norm/layer4": 10.331953763961792, + "mean_norm/layer5": 13.04720538854599, + "mean_norm/layer6": 9.784554660320282, + "mean_norm/layer7": 10.37237673997879, + "mean_norm/layer8": 10.91523164510727, + "mean_norm/layer9": 10.834782660007477, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 11650 + }, + { + "epoch": 4.86, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.47108617969279193, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.6874008178710938, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8478, + "eval_samples_per_second": 20.341, + "eval_steps_per_second": 0.675, + "step": 11650 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.89, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5063, + "max_norm": 37.657135009765625, + "max_norm/layer0": 29.120641708374023, + "max_norm/layer1": 30.76626205444336, + "max_norm/layer10": 32.23412322998047, + "max_norm/layer11": 29.978626251220703, + "max_norm/layer12": 34.04027557373047, + "max_norm/layer13": 29.84294891357422, + "max_norm/layer14": 31.073169708251953, + "max_norm/layer15": 37.47862243652344, + "max_norm/layer16": 31.013898849487305, + "max_norm/layer17": 37.55109786987305, + "max_norm/layer18": 32.71333694458008, + "max_norm/layer19": 32.22544860839844, + "max_norm/layer2": 23.74456214904785, + "max_norm/layer20": 32.7411003112793, + "max_norm/layer21": 32.6014518737793, + "max_norm/layer22": 33.357295989990234, + "max_norm/layer23": 31.693147659301758, + "max_norm/layer3": 29.81475257873535, + "max_norm/layer4": 29.48421287536621, + "max_norm/layer5": 37.657135009765625, + "max_norm/layer6": 24.843406677246094, + "max_norm/layer7": 32.288936614990234, + "max_norm/layer8": 31.590938568115234, + "max_norm/layer9": 31.715600967407227, + "mean_norm": 11.138802573084831, + "mean_norm/layer0": 10.853290915489197, + "mean_norm/layer1": 10.593591392040253, + "mean_norm/layer10": 10.93671852350235, + "mean_norm/layer11": 11.29314911365509, + "mean_norm/layer12": 11.936418116092682, + "mean_norm/layer13": 10.9469895362854, + "mean_norm/layer14": 11.370279312133789, + "mean_norm/layer15": 11.754273056983948, + "mean_norm/layer16": 11.025372207164764, + "mean_norm/layer17": 11.554012775421143, + "mean_norm/layer18": 11.035687029361725, + "mean_norm/layer19": 11.097853183746338, + "mean_norm/layer2": 9.013607859611511, + "mean_norm/layer20": 11.206229448318481, + "mean_norm/layer21": 11.168822050094604, + "mean_norm/layer22": 12.272729098796844, + "mean_norm/layer23": 12.221702218055725, + "mean_norm/layer3": 11.708347916603088, + "mean_norm/layer4": 10.339655816555023, + "mean_norm/layer5": 13.06405371427536, + "mean_norm/layer6": 9.790289580821991, + "mean_norm/layer7": 10.380003929138184, + "mean_norm/layer8": 10.924476206302643, + "mean_norm/layer9": 10.843708753585815, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 11700 + }, + { + "epoch": 4.89, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.47012488693655874, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.693180561065674, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8334, + "eval_samples_per_second": 20.366, + "eval_steps_per_second": 0.676, + "step": 11700 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.91, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5059, + "max_norm": 37.756587982177734, + "max_norm/layer0": 29.19428253173828, + "max_norm/layer1": 30.85544204711914, + "max_norm/layer10": 32.325218200683594, + "max_norm/layer11": 30.0484619140625, + "max_norm/layer12": 34.143394470214844, + "max_norm/layer13": 29.933761596679688, + "max_norm/layer14": 31.147777557373047, + "max_norm/layer15": 37.59746551513672, + "max_norm/layer16": 31.10285758972168, + "max_norm/layer17": 37.67106628417969, + "max_norm/layer18": 32.811126708984375, + "max_norm/layer19": 32.30681610107422, + "max_norm/layer2": 23.80467987060547, + "max_norm/layer20": 32.834537506103516, + "max_norm/layer21": 32.69060516357422, + "max_norm/layer22": 33.47240447998047, + "max_norm/layer23": 31.775291442871094, + "max_norm/layer3": 29.894990921020508, + "max_norm/layer4": 29.559480667114258, + "max_norm/layer5": 37.756587982177734, + "max_norm/layer6": 24.900632858276367, + "max_norm/layer7": 32.3841552734375, + "max_norm/layer8": 31.64830780029297, + "max_norm/layer9": 31.78627586364746, + "mean_norm": 11.148543067276478, + "mean_norm/layer0": 10.865490138530731, + "mean_norm/layer1": 10.602823853492737, + "mean_norm/layer10": 10.94576382637024, + "mean_norm/layer11": 11.303158342838287, + "mean_norm/layer12": 11.949087858200073, + "mean_norm/layer13": 10.956337213516235, + "mean_norm/layer14": 11.380485773086548, + "mean_norm/layer15": 11.765974640846252, + "mean_norm/layer16": 11.034591972827911, + "mean_norm/layer17": 11.564175546169281, + "mean_norm/layer18": 11.04419356584549, + "mean_norm/layer19": 11.106570959091187, + "mean_norm/layer2": 9.01699161529541, + "mean_norm/layer20": 11.21491664648056, + "mean_norm/layer21": 11.177606880664825, + "mean_norm/layer22": 12.284631669521332, + "mean_norm/layer23": 12.233553946018219, + "mean_norm/layer3": 11.720988273620605, + "mean_norm/layer4": 10.347264647483826, + "mean_norm/layer5": 13.080726027488708, + "mean_norm/layer6": 9.79598182439804, + "mean_norm/layer7": 10.387580871582031, + "mean_norm/layer8": 10.933634042739868, + "mean_norm/layer9": 10.852503478527069, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 11750 + }, + { + "epoch": 4.91, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46984501689360475, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.688762903213501, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6509, + "eval_samples_per_second": 20.685, + "eval_steps_per_second": 0.687, + "step": 11750 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.93, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5079, + "max_norm": 37.85048294067383, + "max_norm/layer0": 29.263450622558594, + "max_norm/layer1": 30.939136505126953, + "max_norm/layer10": 32.416481018066406, + "max_norm/layer11": 30.116899490356445, + "max_norm/layer12": 34.24009323120117, + "max_norm/layer13": 30.03861427307129, + "max_norm/layer14": 31.231199264526367, + "max_norm/layer15": 37.69263458251953, + "max_norm/layer16": 31.176904678344727, + "max_norm/layer17": 37.800819396972656, + "max_norm/layer18": 32.89786911010742, + "max_norm/layer19": 32.403892517089844, + "max_norm/layer2": 23.873645782470703, + "max_norm/layer20": 32.9393424987793, + "max_norm/layer21": 32.77646255493164, + "max_norm/layer22": 33.565677642822266, + "max_norm/layer23": 31.855518341064453, + "max_norm/layer3": 29.965782165527344, + "max_norm/layer4": 29.643163681030273, + "max_norm/layer5": 37.85048294067383, + "max_norm/layer6": 24.967506408691406, + "max_norm/layer7": 32.4691162109375, + "max_norm/layer8": 31.7069034576416, + "max_norm/layer9": 31.866910934448242, + "mean_norm": 11.158328091104826, + "mean_norm/layer0": 10.877790868282318, + "mean_norm/layer1": 10.612155139446259, + "mean_norm/layer10": 10.95480102300644, + "mean_norm/layer11": 11.313199162483215, + "mean_norm/layer12": 11.961796998977661, + "mean_norm/layer13": 10.965710639953613, + "mean_norm/layer14": 11.390668153762817, + "mean_norm/layer15": 11.77765667438507, + "mean_norm/layer16": 11.043775260448456, + "mean_norm/layer17": 11.574420154094696, + "mean_norm/layer18": 11.052655577659607, + "mean_norm/layer19": 11.115290462970734, + "mean_norm/layer2": 9.02040845155716, + "mean_norm/layer20": 11.223563849925995, + "mean_norm/layer21": 11.186604678630829, + "mean_norm/layer22": 12.29665869474411, + "mean_norm/layer23": 12.245661318302155, + "mean_norm/layer3": 11.73361337184906, + "mean_norm/layer4": 10.354853808879852, + "mean_norm/layer5": 13.097476840019226, + "mean_norm/layer6": 9.801718294620514, + "mean_norm/layer7": 10.395187497138977, + "mean_norm/layer8": 10.942837297916412, + "mean_norm/layer9": 10.861369967460632, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 11800 + }, + { + "epoch": 4.93, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4696624929525478, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.688814401626587, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8439, + "eval_samples_per_second": 20.348, + "eval_steps_per_second": 0.675, + "step": 11800 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.95, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5014, + "max_norm": 37.93788528442383, + "max_norm/layer0": 29.340675354003906, + "max_norm/layer1": 31.018381118774414, + "max_norm/layer10": 32.511417388916016, + "max_norm/layer11": 30.187868118286133, + "max_norm/layer12": 34.35157775878906, + "max_norm/layer13": 30.132198333740234, + "max_norm/layer14": 31.31639289855957, + "max_norm/layer15": 37.80784606933594, + "max_norm/layer16": 31.25621795654297, + "max_norm/layer17": 37.93748474121094, + "max_norm/layer18": 32.988922119140625, + "max_norm/layer19": 32.515724182128906, + "max_norm/layer2": 23.931446075439453, + "max_norm/layer20": 33.02553939819336, + "max_norm/layer21": 32.86348342895508, + "max_norm/layer22": 33.67148208618164, + "max_norm/layer23": 31.935056686401367, + "max_norm/layer3": 30.043079376220703, + "max_norm/layer4": 29.730466842651367, + "max_norm/layer5": 37.93788528442383, + "max_norm/layer6": 25.02423667907715, + "max_norm/layer7": 32.552818298339844, + "max_norm/layer8": 31.76500701904297, + "max_norm/layer9": 31.92847442626953, + "mean_norm": 11.168228807548681, + "mean_norm/layer0": 10.890288770198822, + "mean_norm/layer1": 10.62157815694809, + "mean_norm/layer10": 10.963908910751343, + "mean_norm/layer11": 11.323238909244537, + "mean_norm/layer12": 11.974679410457611, + "mean_norm/layer13": 10.975349426269531, + "mean_norm/layer14": 11.401008605957031, + "mean_norm/layer15": 11.789547324180603, + "mean_norm/layer16": 11.053157031536102, + "mean_norm/layer17": 11.58478707075119, + "mean_norm/layer18": 11.061248421669006, + "mean_norm/layer19": 11.124230206012726, + "mean_norm/layer2": 9.023894667625427, + "mean_norm/layer20": 11.232537388801575, + "mean_norm/layer21": 11.19556349515915, + "mean_norm/layer22": 12.30886971950531, + "mean_norm/layer23": 12.257866203784943, + "mean_norm/layer3": 11.746358752250671, + "mean_norm/layer4": 10.362483322620392, + "mean_norm/layer5": 13.114296019077301, + "mean_norm/layer6": 9.807480454444885, + "mean_norm/layer7": 10.402803540229797, + "mean_norm/layer8": 10.952084362506866, + "mean_norm/layer9": 10.870231211185455, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 11850 + }, + { + "epoch": 4.95, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4705872809205696, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.683215856552124, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6413, + "eval_samples_per_second": 20.702, + "eval_steps_per_second": 0.687, + "step": 11850 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.97, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.519, + "max_norm": 38.05906295776367, + "max_norm/layer0": 29.42703628540039, + "max_norm/layer1": 31.089515686035156, + "max_norm/layer10": 32.583194732666016, + "max_norm/layer11": 30.255687713623047, + "max_norm/layer12": 34.46479797363281, + "max_norm/layer13": 30.210359573364258, + "max_norm/layer14": 31.400686264038086, + "max_norm/layer15": 37.92513656616211, + "max_norm/layer16": 31.335044860839844, + "max_norm/layer17": 38.05906295776367, + "max_norm/layer18": 33.082340240478516, + "max_norm/layer19": 32.62194061279297, + "max_norm/layer2": 24.000274658203125, + "max_norm/layer20": 33.11968994140625, + "max_norm/layer21": 32.96305847167969, + "max_norm/layer22": 33.76947021484375, + "max_norm/layer23": 32.0211181640625, + "max_norm/layer3": 30.126047134399414, + "max_norm/layer4": 29.8212947845459, + "max_norm/layer5": 38.0276985168457, + "max_norm/layer6": 25.084314346313477, + "max_norm/layer7": 32.645408630371094, + "max_norm/layer8": 31.83109474182129, + "max_norm/layer9": 32.01667022705078, + "mean_norm": 11.177929555376371, + "mean_norm/layer0": 10.902526676654816, + "mean_norm/layer1": 10.630789399147034, + "mean_norm/layer10": 10.972841262817383, + "mean_norm/layer11": 11.333194494247437, + "mean_norm/layer12": 11.987314462661743, + "mean_norm/layer13": 10.98465383052826, + "mean_norm/layer14": 11.411219239234924, + "mean_norm/layer15": 11.801235556602478, + "mean_norm/layer16": 11.062246561050415, + "mean_norm/layer17": 11.594827890396118, + "mean_norm/layer18": 11.069670617580414, + "mean_norm/layer19": 11.132874488830566, + "mean_norm/layer2": 9.027332544326782, + "mean_norm/layer20": 11.241263806819916, + "mean_norm/layer21": 11.204251945018768, + "mean_norm/layer22": 12.320836007595062, + "mean_norm/layer23": 12.269861817359924, + "mean_norm/layer3": 11.758853018283844, + "mean_norm/layer4": 10.370031774044037, + "mean_norm/layer5": 13.130874693393707, + "mean_norm/layer6": 9.813177287578583, + "mean_norm/layer7": 10.41031789779663, + "mean_norm/layer8": 10.961123704910278, + "mean_norm/layer9": 10.878990352153778, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 11900 + }, + { + "epoch": 4.97, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4704128691546708, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.6838083267211914, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6596, + "eval_samples_per_second": 20.67, + "eval_steps_per_second": 0.686, + "step": 11900 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 4.99, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.5041, + "max_norm": 38.194522857666016, + "max_norm/layer0": 29.501251220703125, + "max_norm/layer1": 31.155527114868164, + "max_norm/layer10": 32.66633224487305, + "max_norm/layer11": 30.323793411254883, + "max_norm/layer12": 34.57496643066406, + "max_norm/layer13": 30.298030853271484, + "max_norm/layer14": 31.500028610229492, + "max_norm/layer15": 38.035335540771484, + "max_norm/layer16": 31.41799545288086, + "max_norm/layer17": 38.194522857666016, + "max_norm/layer18": 33.178749084472656, + "max_norm/layer19": 32.73746109008789, + "max_norm/layer2": 24.063013076782227, + "max_norm/layer20": 33.205509185791016, + "max_norm/layer21": 33.06170654296875, + "max_norm/layer22": 33.85256576538086, + "max_norm/layer23": 32.10818862915039, + "max_norm/layer3": 30.200939178466797, + "max_norm/layer4": 29.90153694152832, + "max_norm/layer5": 38.12092590332031, + "max_norm/layer6": 25.150123596191406, + "max_norm/layer7": 32.741180419921875, + "max_norm/layer8": 31.89752197265625, + "max_norm/layer9": 32.092933654785156, + "mean_norm": 11.187665241460005, + "mean_norm/layer0": 10.914686381816864, + "mean_norm/layer1": 10.640029609203339, + "mean_norm/layer10": 10.981725633144379, + "mean_norm/layer11": 11.343181252479553, + "mean_norm/layer12": 11.999892354011536, + "mean_norm/layer13": 10.993940532207489, + "mean_norm/layer14": 11.421403646469116, + "mean_norm/layer15": 11.812836050987244, + "mean_norm/layer16": 11.071481466293335, + "mean_norm/layer17": 11.604974210262299, + "mean_norm/layer18": 11.078194618225098, + "mean_norm/layer19": 11.141615271568298, + "mean_norm/layer2": 9.03076058626175, + "mean_norm/layer20": 11.250074625015259, + "mean_norm/layer21": 11.213150680065155, + "mean_norm/layer22": 12.33284342288971, + "mean_norm/layer23": 12.281926989555359, + "mean_norm/layer3": 11.771265745162964, + "mean_norm/layer4": 10.37760877609253, + "mean_norm/layer5": 13.147468388080597, + "mean_norm/layer6": 9.818911015987396, + "mean_norm/layer7": 10.417860507965088, + "mean_norm/layer8": 10.970265984535217, + "mean_norm/layer9": 10.887868046760559, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 11950 + }, + { + "epoch": 4.99, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4704534300304612, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.6852517127990723, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6451, + "eval_samples_per_second": 20.695, + "eval_steps_per_second": 0.687, + "step": 11950 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.01, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.3794, + "max_norm": 38.302860260009766, + "max_norm/layer0": 29.574535369873047, + "max_norm/layer1": 31.22898292541504, + "max_norm/layer10": 32.7488899230957, + "max_norm/layer11": 30.39142608642578, + "max_norm/layer12": 34.67290496826172, + "max_norm/layer13": 30.389312744140625, + "max_norm/layer14": 31.585010528564453, + "max_norm/layer15": 38.15389633178711, + "max_norm/layer16": 31.482175827026367, + "max_norm/layer17": 38.302860260009766, + "max_norm/layer18": 33.27186965942383, + "max_norm/layer19": 32.84207534790039, + "max_norm/layer2": 24.129867553710938, + "max_norm/layer20": 33.300254821777344, + "max_norm/layer21": 33.150123596191406, + "max_norm/layer22": 33.929691314697266, + "max_norm/layer23": 32.196044921875, + "max_norm/layer3": 30.272613525390625, + "max_norm/layer4": 29.979124069213867, + "max_norm/layer5": 38.213741302490234, + "max_norm/layer6": 25.21087074279785, + "max_norm/layer7": 32.830772399902344, + "max_norm/layer8": 31.961711883544922, + "max_norm/layer9": 32.1682243347168, + "mean_norm": 11.19739151497682, + "mean_norm/layer0": 10.926727831363678, + "mean_norm/layer1": 10.64928013086319, + "mean_norm/layer10": 10.990540206432343, + "mean_norm/layer11": 11.35308039188385, + "mean_norm/layer12": 12.012557685375214, + "mean_norm/layer13": 11.003331005573273, + "mean_norm/layer14": 11.4315704703331, + "mean_norm/layer15": 11.824599802494049, + "mean_norm/layer16": 11.080740988254547, + "mean_norm/layer17": 11.61514014005661, + "mean_norm/layer18": 11.086707293987274, + "mean_norm/layer19": 11.150398910045624, + "mean_norm/layer2": 9.034183740615845, + "mean_norm/layer20": 11.259066879749298, + "mean_norm/layer21": 11.222183465957642, + "mean_norm/layer22": 12.344780445098877, + "mean_norm/layer23": 12.294032156467438, + "mean_norm/layer3": 11.783682465553284, + "mean_norm/layer4": 10.38510811328888, + "mean_norm/layer5": 13.16391259431839, + "mean_norm/layer6": 9.824450016021729, + "mean_norm/layer7": 10.425398409366608, + "mean_norm/layer8": 10.979355573654175, + "mean_norm/layer9": 10.896567642688751, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 12000 + }, + { + "epoch": 5.01, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46842944232851874, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.722437858581543, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6518, + "eval_samples_per_second": 20.684, + "eval_steps_per_second": 0.687, + "step": 12000 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.03, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.3033, + "max_norm": 38.435333251953125, + "max_norm/layer0": 29.649662017822266, + "max_norm/layer1": 31.303651809692383, + "max_norm/layer10": 32.83454895019531, + "max_norm/layer11": 30.47419548034668, + "max_norm/layer12": 34.7756462097168, + "max_norm/layer13": 30.48672103881836, + "max_norm/layer14": 31.663904190063477, + "max_norm/layer15": 38.27345657348633, + "max_norm/layer16": 31.572792053222656, + "max_norm/layer17": 38.435333251953125, + "max_norm/layer18": 33.37535095214844, + "max_norm/layer19": 32.94023895263672, + "max_norm/layer2": 24.199243545532227, + "max_norm/layer20": 33.396766662597656, + "max_norm/layer21": 33.266395568847656, + "max_norm/layer22": 34.011863708496094, + "max_norm/layer23": 32.28325653076172, + "max_norm/layer3": 30.342016220092773, + "max_norm/layer4": 30.060850143432617, + "max_norm/layer5": 38.307411193847656, + "max_norm/layer6": 25.27783203125, + "max_norm/layer7": 32.91995620727539, + "max_norm/layer8": 32.02895736694336, + "max_norm/layer9": 32.24490737915039, + "mean_norm": 11.207477805515131, + "mean_norm/layer0": 10.939489781856537, + "mean_norm/layer1": 10.658688187599182, + "mean_norm/layer10": 10.99948763847351, + "mean_norm/layer11": 11.363388180732727, + "mean_norm/layer12": 12.025580883026123, + "mean_norm/layer13": 11.013049066066742, + "mean_norm/layer14": 11.442092716693878, + "mean_norm/layer15": 11.836634337902069, + "mean_norm/layer16": 11.090266406536102, + "mean_norm/layer17": 11.625772356987, + "mean_norm/layer18": 11.095670282840729, + "mean_norm/layer19": 11.15985506772995, + "mean_norm/layer2": 9.037715494632721, + "mean_norm/layer20": 11.268753230571747, + "mean_norm/layer21": 11.231657326221466, + "mean_norm/layer22": 12.357149720191956, + "mean_norm/layer23": 12.30664312839508, + "mean_norm/layer3": 11.796434462070465, + "mean_norm/layer4": 10.392972588539124, + "mean_norm/layer5": 13.180622637271881, + "mean_norm/layer6": 9.830242931842804, + "mean_norm/layer7": 10.433066010475159, + "mean_norm/layer8": 10.988660275936127, + "mean_norm/layer9": 10.90557461977005, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 12050 + }, + { + "epoch": 5.03, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46702197993859085, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7288458347320557, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.849, + "eval_samples_per_second": 20.339, + "eval_steps_per_second": 0.675, + "step": 12050 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.05, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.3092, + "max_norm": 38.57270812988281, + "max_norm/layer0": 29.720144271850586, + "max_norm/layer1": 31.386343002319336, + "max_norm/layer10": 32.91311264038086, + "max_norm/layer11": 30.554622650146484, + "max_norm/layer12": 34.88260269165039, + "max_norm/layer13": 30.58049774169922, + "max_norm/layer14": 31.75419044494629, + "max_norm/layer15": 38.385005950927734, + "max_norm/layer16": 31.658222198486328, + "max_norm/layer17": 38.57270812988281, + "max_norm/layer18": 33.51114273071289, + "max_norm/layer19": 33.040367126464844, + "max_norm/layer2": 24.25741195678711, + "max_norm/layer20": 33.488975524902344, + "max_norm/layer21": 33.363487243652344, + "max_norm/layer22": 34.08940505981445, + "max_norm/layer23": 32.368831634521484, + "max_norm/layer3": 30.41705894470215, + "max_norm/layer4": 30.137144088745117, + "max_norm/layer5": 38.41334533691406, + "max_norm/layer6": 25.35138702392578, + "max_norm/layer7": 33.001834869384766, + "max_norm/layer8": 32.105072021484375, + "max_norm/layer9": 32.34452438354492, + "mean_norm": 11.21775616457065, + "mean_norm/layer0": 10.952854812145233, + "mean_norm/layer1": 10.668235659599304, + "mean_norm/layer10": 11.008642077445984, + "mean_norm/layer11": 11.373880326747894, + "mean_norm/layer12": 12.038914799690247, + "mean_norm/layer13": 11.02297329902649, + "mean_norm/layer14": 11.452847063541412, + "mean_norm/layer15": 11.848887979984283, + "mean_norm/layer16": 11.099906980991364, + "mean_norm/layer17": 11.636568486690521, + "mean_norm/layer18": 11.10478299856186, + "mean_norm/layer19": 11.169407188892365, + "mean_norm/layer2": 9.04135924577713, + "mean_norm/layer20": 11.278404533863068, + "mean_norm/layer21": 11.241189360618591, + "mean_norm/layer22": 12.369754791259766, + "mean_norm/layer23": 12.31940084695816, + "mean_norm/layer3": 11.80949753522873, + "mean_norm/layer4": 10.400984764099121, + "mean_norm/layer5": 13.19771432876587, + "mean_norm/layer6": 9.83626252412796, + "mean_norm/layer7": 10.44089788198471, + "mean_norm/layer8": 10.998125731945038, + "mean_norm/layer9": 10.914654731750488, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 12100 + }, + { + "epoch": 5.05, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46599173369351393, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7484076023101807, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8461, + "eval_samples_per_second": 20.344, + "eval_steps_per_second": 0.675, + "step": 12100 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.07, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.3214, + "max_norm": 38.711116790771484, + "max_norm/layer0": 29.78860092163086, + "max_norm/layer1": 31.47394561767578, + "max_norm/layer10": 33.007537841796875, + "max_norm/layer11": 30.644929885864258, + "max_norm/layer12": 34.98715591430664, + "max_norm/layer13": 30.685518264770508, + "max_norm/layer14": 31.84963035583496, + "max_norm/layer15": 38.483680725097656, + "max_norm/layer16": 31.737163543701172, + "max_norm/layer17": 38.711116790771484, + "max_norm/layer18": 33.6363639831543, + "max_norm/layer19": 33.14191818237305, + "max_norm/layer2": 24.332351684570312, + "max_norm/layer20": 33.56949234008789, + "max_norm/layer21": 33.465484619140625, + "max_norm/layer22": 34.195106506347656, + "max_norm/layer23": 32.45437240600586, + "max_norm/layer3": 30.49375343322754, + "max_norm/layer4": 30.231184005737305, + "max_norm/layer5": 38.51918029785156, + "max_norm/layer6": 25.419851303100586, + "max_norm/layer7": 33.08552551269531, + "max_norm/layer8": 32.17802810668945, + "max_norm/layer9": 32.42779541015625, + "mean_norm": 11.228026956319809, + "mean_norm/layer0": 10.966456592082977, + "mean_norm/layer1": 10.677858173847198, + "mean_norm/layer10": 11.017882645130157, + "mean_norm/layer11": 11.384362578392029, + "mean_norm/layer12": 12.052213430404663, + "mean_norm/layer13": 11.032799184322357, + "mean_norm/layer14": 11.463645279407501, + "mean_norm/layer15": 11.861131072044373, + "mean_norm/layer16": 11.109526216983795, + "mean_norm/layer17": 11.647267878055573, + "mean_norm/layer18": 11.113752365112305, + "mean_norm/layer19": 11.178877294063568, + "mean_norm/layer2": 9.04505831003189, + "mean_norm/layer20": 11.28793090581894, + "mean_norm/layer21": 11.250765681266785, + "mean_norm/layer22": 12.382255971431732, + "mean_norm/layer23": 12.33215218782425, + "mean_norm/layer3": 11.82255333662033, + "mean_norm/layer4": 10.40901243686676, + "mean_norm/layer5": 13.214745044708252, + "mean_norm/layer6": 9.842304766178131, + "mean_norm/layer7": 10.448727905750275, + "mean_norm/layer8": 11.007568538188934, + "mean_norm/layer9": 10.92379915714264, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 12150 + }, + { + "epoch": 5.07, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4671112138653298, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7360055446624756, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6542, + "eval_samples_per_second": 20.679, + "eval_steps_per_second": 0.686, + "step": 12150 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.09, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.3385, + "max_norm": 38.83620834350586, + "max_norm/layer0": 29.86420440673828, + "max_norm/layer1": 31.559425354003906, + "max_norm/layer10": 33.10588073730469, + "max_norm/layer11": 30.738574981689453, + "max_norm/layer12": 35.08659362792969, + "max_norm/layer13": 30.78911781311035, + "max_norm/layer14": 31.945295333862305, + "max_norm/layer15": 38.5927848815918, + "max_norm/layer16": 31.82872200012207, + "max_norm/layer17": 38.83620834350586, + "max_norm/layer18": 33.7295036315918, + "max_norm/layer19": 33.2426643371582, + "max_norm/layer2": 24.397293090820312, + "max_norm/layer20": 33.64811706542969, + "max_norm/layer21": 33.56774139404297, + "max_norm/layer22": 34.284812927246094, + "max_norm/layer23": 32.54706954956055, + "max_norm/layer3": 30.576663970947266, + "max_norm/layer4": 30.337905883789062, + "max_norm/layer5": 38.61861038208008, + "max_norm/layer6": 25.4854736328125, + "max_norm/layer7": 33.1692008972168, + "max_norm/layer8": 32.24501419067383, + "max_norm/layer9": 32.51561737060547, + "mean_norm": 11.23827119419972, + "mean_norm/layer0": 10.980204999446869, + "mean_norm/layer1": 10.687390863895416, + "mean_norm/layer10": 11.027082443237305, + "mean_norm/layer11": 11.394726574420929, + "mean_norm/layer12": 12.06546550989151, + "mean_norm/layer13": 11.042561769485474, + "mean_norm/layer14": 11.474426746368408, + "mean_norm/layer15": 11.873374342918396, + "mean_norm/layer16": 11.119168400764465, + "mean_norm/layer17": 11.657908141613007, + "mean_norm/layer18": 11.122701942920685, + "mean_norm/layer19": 11.188299894332886, + "mean_norm/layer2": 9.04871541261673, + "mean_norm/layer20": 11.297274112701416, + "mean_norm/layer21": 11.260233700275421, + "mean_norm/layer22": 12.394688069820404, + "mean_norm/layer23": 12.344739496707916, + "mean_norm/layer3": 11.835649728775024, + "mean_norm/layer4": 10.417012393474579, + "mean_norm/layer5": 13.231845915317535, + "mean_norm/layer6": 9.848419427871704, + "mean_norm/layer7": 10.456669807434082, + "mean_norm/layer8": 11.017016351222992, + "mean_norm/layer9": 10.932932615280151, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 12200 + }, + { + "epoch": 5.09, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4663283889625745, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7343714237213135, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8312, + "eval_samples_per_second": 20.37, + "eval_steps_per_second": 0.676, + "step": 12200 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.11, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.3454, + "max_norm": 38.94695281982422, + "max_norm/layer0": 29.94550895690918, + "max_norm/layer1": 31.643796920776367, + "max_norm/layer10": 33.20231246948242, + "max_norm/layer11": 30.815670013427734, + "max_norm/layer12": 35.189117431640625, + "max_norm/layer13": 30.878437042236328, + "max_norm/layer14": 32.03306198120117, + "max_norm/layer15": 38.69236373901367, + "max_norm/layer16": 31.911941528320312, + "max_norm/layer17": 38.94695281982422, + "max_norm/layer18": 33.80670928955078, + "max_norm/layer19": 33.32986068725586, + "max_norm/layer2": 24.444849014282227, + "max_norm/layer20": 33.73457717895508, + "max_norm/layer21": 33.681278228759766, + "max_norm/layer22": 34.373939514160156, + "max_norm/layer23": 32.62388229370117, + "max_norm/layer3": 30.654300689697266, + "max_norm/layer4": 30.43708038330078, + "max_norm/layer5": 38.72135925292969, + "max_norm/layer6": 25.56049156188965, + "max_norm/layer7": 33.244224548339844, + "max_norm/layer8": 32.313419342041016, + "max_norm/layer9": 32.6116943359375, + "mean_norm": 11.248527511954308, + "mean_norm/layer0": 10.99410879611969, + "mean_norm/layer1": 10.696984589099884, + "mean_norm/layer10": 11.036336183547974, + "mean_norm/layer11": 11.405112087726593, + "mean_norm/layer12": 12.078685998916626, + "mean_norm/layer13": 11.052375078201294, + "mean_norm/layer14": 11.485212564468384, + "mean_norm/layer15": 11.88576340675354, + "mean_norm/layer16": 11.128781139850616, + "mean_norm/layer17": 11.668495118618011, + "mean_norm/layer18": 11.131764531135559, + "mean_norm/layer19": 11.197697877883911, + "mean_norm/layer2": 9.05235469341278, + "mean_norm/layer20": 11.306506991386414, + "mean_norm/layer21": 11.269656121730804, + "mean_norm/layer22": 12.406981706619263, + "mean_norm/layer23": 12.357316255569458, + "mean_norm/layer3": 11.848814308643341, + "mean_norm/layer4": 10.424997925758362, + "mean_norm/layer5": 13.248937249183655, + "mean_norm/layer6": 9.85450428724289, + "mean_norm/layer7": 10.464615046977997, + "mean_norm/layer8": 11.02652508020401, + "mean_norm/layer9": 10.942133247852325, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 12250 + }, + { + "epoch": 5.11, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4667056051074255, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.738703489303589, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8467, + "eval_samples_per_second": 20.343, + "eval_steps_per_second": 0.675, + "step": 12250 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.14, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.3659, + "max_norm": 39.07551956176758, + "max_norm/layer0": 30.023889541625977, + "max_norm/layer1": 31.72894287109375, + "max_norm/layer10": 33.298709869384766, + "max_norm/layer11": 30.895883560180664, + "max_norm/layer12": 35.28593444824219, + "max_norm/layer13": 30.964996337890625, + "max_norm/layer14": 32.12107849121094, + "max_norm/layer15": 38.7972412109375, + "max_norm/layer16": 32.01172637939453, + "max_norm/layer17": 39.07551956176758, + "max_norm/layer18": 33.89895248413086, + "max_norm/layer19": 33.43098449707031, + "max_norm/layer2": 24.488872528076172, + "max_norm/layer20": 33.816402435302734, + "max_norm/layer21": 33.77363586425781, + "max_norm/layer22": 34.466548919677734, + "max_norm/layer23": 32.704017639160156, + "max_norm/layer3": 30.721336364746094, + "max_norm/layer4": 30.511106491088867, + "max_norm/layer5": 38.81980895996094, + "max_norm/layer6": 25.633987426757812, + "max_norm/layer7": 33.3271598815918, + "max_norm/layer8": 32.375736236572266, + "max_norm/layer9": 32.68894958496094, + "mean_norm": 11.258795611560345, + "mean_norm/layer0": 11.00811630487442, + "mean_norm/layer1": 10.706629991531372, + "mean_norm/layer10": 11.045571565628052, + "mean_norm/layer11": 11.415521442890167, + "mean_norm/layer12": 12.091852962970734, + "mean_norm/layer13": 11.062187731266022, + "mean_norm/layer14": 11.495945274829865, + "mean_norm/layer15": 11.898083865642548, + "mean_norm/layer16": 11.138496458530426, + "mean_norm/layer17": 11.679109454154968, + "mean_norm/layer18": 11.14063447713852, + "mean_norm/layer19": 11.207036793231964, + "mean_norm/layer2": 9.056014776229858, + "mean_norm/layer20": 11.315796852111816, + "mean_norm/layer21": 11.279004096984863, + "mean_norm/layer22": 12.419390439987183, + "mean_norm/layer23": 12.369924485683441, + "mean_norm/layer3": 11.862018048763275, + "mean_norm/layer4": 10.433027982711792, + "mean_norm/layer5": 13.266180872917175, + "mean_norm/layer6": 9.860602617263794, + "mean_norm/layer7": 10.472546875476837, + "mean_norm/layer8": 11.036045849323273, + "mean_norm/layer9": 10.951355457305908, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 12300 + }, + { + "epoch": 5.14, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46643790332720864, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.738595724105835, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8552, + "eval_samples_per_second": 20.329, + "eval_steps_per_second": 0.675, + "step": 12300 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.16, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.3723, + "max_norm": 39.21499252319336, + "max_norm/layer0": 30.096342086791992, + "max_norm/layer1": 31.81536293029785, + "max_norm/layer10": 33.39365005493164, + "max_norm/layer11": 30.970529556274414, + "max_norm/layer12": 35.38508605957031, + "max_norm/layer13": 31.051616668701172, + "max_norm/layer14": 32.2015266418457, + "max_norm/layer15": 38.904335021972656, + "max_norm/layer16": 32.10439682006836, + "max_norm/layer17": 39.21499252319336, + "max_norm/layer18": 33.9943733215332, + "max_norm/layer19": 33.54290771484375, + "max_norm/layer2": 24.53144645690918, + "max_norm/layer20": 33.91130065917969, + "max_norm/layer21": 33.88111114501953, + "max_norm/layer22": 34.56108093261719, + "max_norm/layer23": 32.789222717285156, + "max_norm/layer3": 30.79220962524414, + "max_norm/layer4": 30.591642379760742, + "max_norm/layer5": 38.921443939208984, + "max_norm/layer6": 25.69824981689453, + "max_norm/layer7": 33.40739440917969, + "max_norm/layer8": 32.45912551879883, + "max_norm/layer9": 32.77835464477539, + "mean_norm": 11.269128928581873, + "mean_norm/layer0": 11.022284209728241, + "mean_norm/layer1": 10.716285347938538, + "mean_norm/layer10": 11.054743885993958, + "mean_norm/layer11": 11.426034033298492, + "mean_norm/layer12": 12.105147123336792, + "mean_norm/layer13": 11.072054088115692, + "mean_norm/layer14": 11.506755590438843, + "mean_norm/layer15": 11.91039365530014, + "mean_norm/layer16": 11.14819085597992, + "mean_norm/layer17": 11.689731240272522, + "mean_norm/layer18": 11.149564683437347, + "mean_norm/layer19": 11.216427028179169, + "mean_norm/layer2": 9.059784173965454, + "mean_norm/layer20": 11.325107753276825, + "mean_norm/layer21": 11.28848946094513, + "mean_norm/layer22": 12.431827366352081, + "mean_norm/layer23": 12.38248485326767, + "mean_norm/layer3": 11.875406265258789, + "mean_norm/layer4": 10.441197097301483, + "mean_norm/layer5": 13.283584535121918, + "mean_norm/layer6": 9.866783261299133, + "mean_norm/layer7": 10.480609238147736, + "mean_norm/layer8": 11.04563707113266, + "mean_norm/layer9": 10.960571467876434, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 12350 + }, + { + "epoch": 5.16, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46718422344175253, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7359020709991455, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8471, + "eval_samples_per_second": 20.342, + "eval_steps_per_second": 0.675, + "step": 12350 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.18, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.3804, + "max_norm": 39.340614318847656, + "max_norm/layer0": 30.16893196105957, + "max_norm/layer1": 31.899879455566406, + "max_norm/layer10": 33.48374557495117, + "max_norm/layer11": 31.040555953979492, + "max_norm/layer12": 35.49278259277344, + "max_norm/layer13": 31.146411895751953, + "max_norm/layer14": 32.291934967041016, + "max_norm/layer15": 39.00080108642578, + "max_norm/layer16": 32.20722198486328, + "max_norm/layer17": 39.340614318847656, + "max_norm/layer18": 34.10038757324219, + "max_norm/layer19": 33.632362365722656, + "max_norm/layer2": 24.594600677490234, + "max_norm/layer20": 33.99564743041992, + "max_norm/layer21": 33.98853302001953, + "max_norm/layer22": 34.644447326660156, + "max_norm/layer23": 32.86933135986328, + "max_norm/layer3": 30.86780548095703, + "max_norm/layer4": 30.658416748046875, + "max_norm/layer5": 39.01528549194336, + "max_norm/layer6": 25.761075973510742, + "max_norm/layer7": 33.47981643676758, + "max_norm/layer8": 32.54744338989258, + "max_norm/layer9": 32.88261413574219, + "mean_norm": 11.279446867605051, + "mean_norm/layer0": 11.036405384540558, + "mean_norm/layer1": 10.72603064775467, + "mean_norm/layer10": 11.063933193683624, + "mean_norm/layer11": 11.436520993709564, + "mean_norm/layer12": 12.118435442447662, + "mean_norm/layer13": 11.082020878791809, + "mean_norm/layer14": 11.517515301704407, + "mean_norm/layer15": 11.922657191753387, + "mean_norm/layer16": 11.157944202423096, + "mean_norm/layer17": 11.700325787067413, + "mean_norm/layer18": 11.158488869667053, + "mean_norm/layer19": 11.225876986980438, + "mean_norm/layer2": 9.06354033946991, + "mean_norm/layer20": 11.334345400333405, + "mean_norm/layer21": 11.297895312309265, + "mean_norm/layer22": 12.444255292415619, + "mean_norm/layer23": 12.39496910572052, + "mean_norm/layer3": 11.888732671737671, + "mean_norm/layer4": 10.449354648590088, + "mean_norm/layer5": 13.300997972488403, + "mean_norm/layer6": 9.872974157333374, + "mean_norm/layer7": 10.488583147525787, + "mean_norm/layer8": 11.055160284042358, + "mean_norm/layer9": 10.969761610031128, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 12400 + }, + { + "epoch": 5.18, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46694897036216804, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7420947551727295, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8371, + "eval_samples_per_second": 20.36, + "eval_steps_per_second": 0.676, + "step": 12400 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.2, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.374, + "max_norm": 39.4640998840332, + "max_norm/layer0": 30.24111557006836, + "max_norm/layer1": 31.98891830444336, + "max_norm/layer10": 33.58835983276367, + "max_norm/layer11": 31.11510467529297, + "max_norm/layer12": 35.58452224731445, + "max_norm/layer13": 31.24594497680664, + "max_norm/layer14": 32.39015579223633, + "max_norm/layer15": 39.09994888305664, + "max_norm/layer16": 32.305450439453125, + "max_norm/layer17": 39.4640998840332, + "max_norm/layer18": 34.1920166015625, + "max_norm/layer19": 33.718265533447266, + "max_norm/layer2": 24.64690589904785, + "max_norm/layer20": 34.07452392578125, + "max_norm/layer21": 34.084495544433594, + "max_norm/layer22": 34.735374450683594, + "max_norm/layer23": 32.95333480834961, + "max_norm/layer3": 30.938343048095703, + "max_norm/layer4": 30.739850997924805, + "max_norm/layer5": 39.114383697509766, + "max_norm/layer6": 25.823427200317383, + "max_norm/layer7": 33.55558395385742, + "max_norm/layer8": 32.629051208496094, + "max_norm/layer9": 32.965084075927734, + "mean_norm": 11.289606223503748, + "mean_norm/layer0": 11.050397753715515, + "mean_norm/layer1": 10.735670387744904, + "mean_norm/layer10": 11.073055744171143, + "mean_norm/layer11": 11.446790933609009, + "mean_norm/layer12": 12.131577014923096, + "mean_norm/layer13": 11.091777503490448, + "mean_norm/layer14": 11.528154075145721, + "mean_norm/layer15": 11.934624075889587, + "mean_norm/layer16": 11.167495727539062, + "mean_norm/layer17": 11.710758984088898, + "mean_norm/layer18": 11.16724556684494, + "mean_norm/layer19": 11.23505425453186, + "mean_norm/layer2": 9.067234516143799, + "mean_norm/layer20": 11.343270659446716, + "mean_norm/layer21": 11.307054281234741, + "mean_norm/layer22": 12.456541776657104, + "mean_norm/layer23": 12.407329261302948, + "mean_norm/layer3": 11.901857256889343, + "mean_norm/layer4": 10.45742917060852, + "mean_norm/layer5": 13.318169116973877, + "mean_norm/layer6": 9.879100859165192, + "mean_norm/layer7": 10.496457755565643, + "mean_norm/layer8": 11.064581274986267, + "mean_norm/layer9": 10.97892141342163, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 12450 + }, + { + "epoch": 5.2, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46639734245141823, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.733039379119873, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8446, + "eval_samples_per_second": 20.347, + "eval_steps_per_second": 0.675, + "step": 12450 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.22, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.3609, + "max_norm": 39.59554672241211, + "max_norm/layer0": 30.308876037597656, + "max_norm/layer1": 32.06950378417969, + "max_norm/layer10": 33.700904846191406, + "max_norm/layer11": 31.186481475830078, + "max_norm/layer12": 35.678646087646484, + "max_norm/layer13": 31.349061965942383, + "max_norm/layer14": 32.47747039794922, + "max_norm/layer15": 39.23009490966797, + "max_norm/layer16": 32.39930725097656, + "max_norm/layer17": 39.59554672241211, + "max_norm/layer18": 34.284759521484375, + "max_norm/layer19": 33.8138313293457, + "max_norm/layer2": 24.689485549926758, + "max_norm/layer20": 34.164310455322266, + "max_norm/layer21": 34.197967529296875, + "max_norm/layer22": 34.82883834838867, + "max_norm/layer23": 33.03238296508789, + "max_norm/layer3": 31.01808738708496, + "max_norm/layer4": 30.82036590576172, + "max_norm/layer5": 39.21382522583008, + "max_norm/layer6": 25.887048721313477, + "max_norm/layer7": 33.6284065246582, + "max_norm/layer8": 32.720245361328125, + "max_norm/layer9": 33.05253601074219, + "mean_norm": 11.29996439566215, + "mean_norm/layer0": 11.064708232879639, + "mean_norm/layer1": 10.745510697364807, + "mean_norm/layer10": 11.082452714443207, + "mean_norm/layer11": 11.457266986370087, + "mean_norm/layer12": 12.14503288269043, + "mean_norm/layer13": 11.101730048656464, + "mean_norm/layer14": 11.539036452770233, + "mean_norm/layer15": 11.946848630905151, + "mean_norm/layer16": 11.177112400531769, + "mean_norm/layer17": 11.721317291259766, + "mean_norm/layer18": 11.176118850708008, + "mean_norm/layer19": 11.24438202381134, + "mean_norm/layer2": 9.071042716503143, + "mean_norm/layer20": 11.352453172206879, + "mean_norm/layer21": 11.316423892974854, + "mean_norm/layer22": 12.468946397304535, + "mean_norm/layer23": 12.419977307319641, + "mean_norm/layer3": 11.915303409099579, + "mean_norm/layer4": 10.465545892715454, + "mean_norm/layer5": 13.335692644119263, + "mean_norm/layer6": 9.885368764400482, + "mean_norm/layer7": 10.50448876619339, + "mean_norm/layer8": 11.074171483516693, + "mean_norm/layer9": 10.988213837146759, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 12500 + }, + { + "epoch": 5.22, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46689218513606145, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7314534187316895, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.652, + "eval_samples_per_second": 20.683, + "eval_steps_per_second": 0.687, + "step": 12500 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.24, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.3862, + "max_norm": 39.70277404785156, + "max_norm/layer0": 30.38404083251953, + "max_norm/layer1": 32.14478302001953, + "max_norm/layer10": 33.805885314941406, + "max_norm/layer11": 31.260480880737305, + "max_norm/layer12": 35.794734954833984, + "max_norm/layer13": 31.43575096130371, + "max_norm/layer14": 32.58359909057617, + "max_norm/layer15": 39.35628128051758, + "max_norm/layer16": 32.494712829589844, + "max_norm/layer17": 39.70277404785156, + "max_norm/layer18": 34.3810920715332, + "max_norm/layer19": 33.91523361206055, + "max_norm/layer2": 24.739246368408203, + "max_norm/layer20": 34.25129699707031, + "max_norm/layer21": 34.31393051147461, + "max_norm/layer22": 34.92304611206055, + "max_norm/layer23": 33.12150573730469, + "max_norm/layer3": 31.105815887451172, + "max_norm/layer4": 30.906110763549805, + "max_norm/layer5": 39.31342697143555, + "max_norm/layer6": 25.954769134521484, + "max_norm/layer7": 33.6923713684082, + "max_norm/layer8": 32.806705474853516, + "max_norm/layer9": 33.13435745239258, + "mean_norm": 11.310173459351063, + "mean_norm/layer0": 11.078775227069855, + "mean_norm/layer1": 10.755265414714813, + "mean_norm/layer10": 11.091667652130127, + "mean_norm/layer11": 11.467542886734009, + "mean_norm/layer12": 12.158098638057709, + "mean_norm/layer13": 11.111486971378326, + "mean_norm/layer14": 11.549628913402557, + "mean_norm/layer15": 11.958956837654114, + "mean_norm/layer16": 11.186640977859497, + "mean_norm/layer17": 11.731778621673584, + "mean_norm/layer18": 11.184843063354492, + "mean_norm/layer19": 11.253638625144958, + "mean_norm/layer2": 9.074791491031647, + "mean_norm/layer20": 11.361482739448547, + "mean_norm/layer21": 11.32561457157135, + "mean_norm/layer22": 12.481294214725494, + "mean_norm/layer23": 12.432406663894653, + "mean_norm/layer3": 11.928609669208527, + "mean_norm/layer4": 10.473615765571594, + "mean_norm/layer5": 13.353126347064972, + "mean_norm/layer6": 9.891473472118378, + "mean_norm/layer7": 10.512412011623383, + "mean_norm/layer8": 11.083585619926453, + "mean_norm/layer9": 10.997426629066467, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 12550 + }, + { + "epoch": 5.24, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46764661742576347, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.731708288192749, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8512, + "eval_samples_per_second": 20.335, + "eval_steps_per_second": 0.675, + "step": 12550 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.26, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.3884, + "max_norm": 39.81848907470703, + "max_norm/layer0": 30.465442657470703, + "max_norm/layer1": 32.21744155883789, + "max_norm/layer10": 33.90283203125, + "max_norm/layer11": 31.341875076293945, + "max_norm/layer12": 35.89216995239258, + "max_norm/layer13": 31.522750854492188, + "max_norm/layer14": 32.66755676269531, + "max_norm/layer15": 39.477203369140625, + "max_norm/layer16": 32.581642150878906, + "max_norm/layer17": 39.81848907470703, + "max_norm/layer18": 34.4770393371582, + "max_norm/layer19": 34.00304412841797, + "max_norm/layer2": 24.784198760986328, + "max_norm/layer20": 34.34490966796875, + "max_norm/layer21": 34.41489791870117, + "max_norm/layer22": 35.03091812133789, + "max_norm/layer23": 33.20782470703125, + "max_norm/layer3": 31.18351173400879, + "max_norm/layer4": 30.99317169189453, + "max_norm/layer5": 39.4189567565918, + "max_norm/layer6": 26.01103401184082, + "max_norm/layer7": 33.767051696777344, + "max_norm/layer8": 32.885719299316406, + "max_norm/layer9": 33.21125793457031, + "mean_norm": 11.320386427144209, + "mean_norm/layer0": 11.092981338500977, + "mean_norm/layer1": 10.765110731124878, + "mean_norm/layer10": 11.1008420586586, + "mean_norm/layer11": 11.477921664714813, + "mean_norm/layer12": 12.171100318431854, + "mean_norm/layer13": 11.121250987052917, + "mean_norm/layer14": 11.560356736183167, + "mean_norm/layer15": 11.971032798290253, + "mean_norm/layer16": 11.196124851703644, + "mean_norm/layer17": 11.742257952690125, + "mean_norm/layer18": 11.193524301052094, + "mean_norm/layer19": 11.262769341468811, + "mean_norm/layer2": 9.07853776216507, + "mean_norm/layer20": 11.370389938354492, + "mean_norm/layer21": 11.334768116474152, + "mean_norm/layer22": 12.493632674217224, + "mean_norm/layer23": 12.444727778434753, + "mean_norm/layer3": 11.94198340177536, + "mean_norm/layer4": 10.481647431850433, + "mean_norm/layer5": 13.370624423027039, + "mean_norm/layer6": 9.897690117359161, + "mean_norm/layer7": 10.52032458782196, + "mean_norm/layer8": 11.093088150024414, + "mean_norm/layer9": 11.006586790084839, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 12600 + }, + { + "epoch": 5.26, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4682955914384103, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7252254486083984, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8473, + "eval_samples_per_second": 20.342, + "eval_steps_per_second": 0.675, + "step": 12600 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.28, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4032, + "max_norm": 39.929420471191406, + "max_norm/layer0": 30.548931121826172, + "max_norm/layer1": 32.29167175292969, + "max_norm/layer10": 34.00247573852539, + "max_norm/layer11": 31.41254997253418, + "max_norm/layer12": 35.99769973754883, + "max_norm/layer13": 31.61075210571289, + "max_norm/layer14": 32.75844192504883, + "max_norm/layer15": 39.58732986450195, + "max_norm/layer16": 32.66705322265625, + "max_norm/layer17": 39.929420471191406, + "max_norm/layer18": 34.565277099609375, + "max_norm/layer19": 34.10858917236328, + "max_norm/layer2": 24.823476791381836, + "max_norm/layer20": 34.442203521728516, + "max_norm/layer21": 34.50871658325195, + "max_norm/layer22": 35.11521530151367, + "max_norm/layer23": 33.29035186767578, + "max_norm/layer3": 31.250028610229492, + "max_norm/layer4": 31.078842163085938, + "max_norm/layer5": 39.521339416503906, + "max_norm/layer6": 26.063798904418945, + "max_norm/layer7": 33.84354782104492, + "max_norm/layer8": 32.952308654785156, + "max_norm/layer9": 33.28911209106445, + "mean_norm": 11.33057057360808, + "mean_norm/layer0": 11.107169270515442, + "mean_norm/layer1": 10.774906635284424, + "mean_norm/layer10": 11.110038161277771, + "mean_norm/layer11": 11.488389551639557, + "mean_norm/layer12": 12.184193432331085, + "mean_norm/layer13": 11.13099753856659, + "mean_norm/layer14": 11.571000754833221, + "mean_norm/layer15": 11.983158111572266, + "mean_norm/layer16": 11.205597698688507, + "mean_norm/layer17": 11.75269091129303, + "mean_norm/layer18": 11.20217877626419, + "mean_norm/layer19": 11.271834790706635, + "mean_norm/layer2": 9.082184433937073, + "mean_norm/layer20": 11.379377901554108, + "mean_norm/layer21": 11.343716561794281, + "mean_norm/layer22": 12.505850672721863, + "mean_norm/layer23": 12.457082509994507, + "mean_norm/layer3": 11.95522665977478, + "mean_norm/layer4": 10.489646911621094, + "mean_norm/layer5": 13.388073563575745, + "mean_norm/layer6": 9.903882265090942, + "mean_norm/layer7": 10.528180718421936, + "mean_norm/layer8": 11.102473735809326, + "mean_norm/layer9": 11.015842199325562, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 12650 + }, + { + "epoch": 5.28, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46865252714536615, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7251226902008057, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8478, + "eval_samples_per_second": 20.341, + "eval_steps_per_second": 0.675, + "step": 12650 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.3, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.3873, + "max_norm": 40.05979919433594, + "max_norm/layer0": 30.627132415771484, + "max_norm/layer1": 32.355186462402344, + "max_norm/layer10": 34.118804931640625, + "max_norm/layer11": 31.481056213378906, + "max_norm/layer12": 36.096923828125, + "max_norm/layer13": 31.706356048583984, + "max_norm/layer14": 32.84482192993164, + "max_norm/layer15": 39.70392608642578, + "max_norm/layer16": 32.7635498046875, + "max_norm/layer17": 40.05979919433594, + "max_norm/layer18": 34.661746978759766, + "max_norm/layer19": 34.22161102294922, + "max_norm/layer2": 24.860652923583984, + "max_norm/layer20": 34.532554626464844, + "max_norm/layer21": 34.61908721923828, + "max_norm/layer22": 35.19852066040039, + "max_norm/layer23": 33.36899185180664, + "max_norm/layer3": 31.320377349853516, + "max_norm/layer4": 31.162757873535156, + "max_norm/layer5": 39.61590576171875, + "max_norm/layer6": 26.116485595703125, + "max_norm/layer7": 33.92621994018555, + "max_norm/layer8": 33.02066421508789, + "max_norm/layer9": 33.36391830444336, + "mean_norm": 11.340739885965982, + "mean_norm/layer0": 11.121292233467102, + "mean_norm/layer1": 10.784716546535492, + "mean_norm/layer10": 11.11919617652893, + "mean_norm/layer11": 11.498693943023682, + "mean_norm/layer12": 12.19723129272461, + "mean_norm/layer13": 11.140634655952454, + "mean_norm/layer14": 11.581675231456757, + "mean_norm/layer15": 11.995171904563904, + "mean_norm/layer16": 11.215030312538147, + "mean_norm/layer17": 11.763100147247314, + "mean_norm/layer18": 11.210864186286926, + "mean_norm/layer19": 11.28091686964035, + "mean_norm/layer2": 9.08584862947464, + "mean_norm/layer20": 11.38850075006485, + "mean_norm/layer21": 11.352761268615723, + "mean_norm/layer22": 12.517931997776031, + "mean_norm/layer23": 12.469390869140625, + "mean_norm/layer3": 11.968517303466797, + "mean_norm/layer4": 10.497656643390656, + "mean_norm/layer5": 13.405577003955841, + "mean_norm/layer6": 9.910086631774902, + "mean_norm/layer7": 10.536053538322449, + "mean_norm/layer8": 11.111887276172638, + "mean_norm/layer9": 11.025021851062775, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 12700 + }, + { + "epoch": 5.3, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4685105640800996, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7220449447631836, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8546, + "eval_samples_per_second": 20.33, + "eval_steps_per_second": 0.675, + "step": 12700 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.32, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.3962, + "max_norm": 40.18087387084961, + "max_norm/layer0": 30.704357147216797, + "max_norm/layer1": 32.41680145263672, + "max_norm/layer10": 34.22196578979492, + "max_norm/layer11": 31.54886245727539, + "max_norm/layer12": 36.20389175415039, + "max_norm/layer13": 31.789897918701172, + "max_norm/layer14": 32.93586349487305, + "max_norm/layer15": 39.839820861816406, + "max_norm/layer16": 32.85014343261719, + "max_norm/layer17": 40.18087387084961, + "max_norm/layer18": 34.7507209777832, + "max_norm/layer19": 34.320194244384766, + "max_norm/layer2": 24.904115676879883, + "max_norm/layer20": 34.61308670043945, + "max_norm/layer21": 34.72566223144531, + "max_norm/layer22": 35.28715896606445, + "max_norm/layer23": 33.438289642333984, + "max_norm/layer3": 31.39183235168457, + "max_norm/layer4": 31.243642807006836, + "max_norm/layer5": 39.70951461791992, + "max_norm/layer6": 26.163026809692383, + "max_norm/layer7": 34.013248443603516, + "max_norm/layer8": 33.09016036987305, + "max_norm/layer9": 33.44902801513672, + "mean_norm": 11.350986532866955, + "mean_norm/layer0": 11.135516226291656, + "mean_norm/layer1": 10.794594943523407, + "mean_norm/layer10": 11.12837165594101, + "mean_norm/layer11": 11.509005963802338, + "mean_norm/layer12": 12.210427522659302, + "mean_norm/layer13": 11.150359153747559, + "mean_norm/layer14": 11.592359781265259, + "mean_norm/layer15": 12.007216930389404, + "mean_norm/layer16": 11.22458028793335, + "mean_norm/layer17": 11.773609936237335, + "mean_norm/layer18": 11.219653248786926, + "mean_norm/layer19": 11.29003256559372, + "mean_norm/layer2": 9.089622676372528, + "mean_norm/layer20": 11.397597908973694, + "mean_norm/layer21": 11.361972987651825, + "mean_norm/layer22": 12.5301353931427, + "mean_norm/layer23": 12.481706082820892, + "mean_norm/layer3": 11.98196655511856, + "mean_norm/layer4": 10.505818009376526, + "mean_norm/layer5": 13.423184752464294, + "mean_norm/layer6": 9.916291773319244, + "mean_norm/layer7": 10.543961584568024, + "mean_norm/layer8": 11.121361255645752, + "mean_norm/layer9": 11.03432959318161, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 12750 + }, + { + "epoch": 5.32, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4678575339798737, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.725661516189575, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6564, + "eval_samples_per_second": 20.675, + "eval_steps_per_second": 0.686, + "step": 12750 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.34, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4083, + "max_norm": 40.30177307128906, + "max_norm/layer0": 30.785463333129883, + "max_norm/layer1": 32.49075698852539, + "max_norm/layer10": 34.32855987548828, + "max_norm/layer11": 31.61981773376465, + "max_norm/layer12": 36.33092498779297, + "max_norm/layer13": 31.879899978637695, + "max_norm/layer14": 33.02179718017578, + "max_norm/layer15": 39.950584411621094, + "max_norm/layer16": 32.93088150024414, + "max_norm/layer17": 40.30177307128906, + "max_norm/layer18": 34.84276580810547, + "max_norm/layer19": 34.421875, + "max_norm/layer2": 24.946029663085938, + "max_norm/layer20": 34.69622802734375, + "max_norm/layer21": 34.828857421875, + "max_norm/layer22": 35.38137435913086, + "max_norm/layer23": 33.52065658569336, + "max_norm/layer3": 31.4727783203125, + "max_norm/layer4": 31.318620681762695, + "max_norm/layer5": 39.80884552001953, + "max_norm/layer6": 26.22019386291504, + "max_norm/layer7": 34.104026794433594, + "max_norm/layer8": 33.16169738769531, + "max_norm/layer9": 33.532066345214844, + "mean_norm": 11.361123723288378, + "mean_norm/layer0": 11.1495241522789, + "mean_norm/layer1": 10.804406702518463, + "mean_norm/layer10": 11.137525200843811, + "mean_norm/layer11": 11.519233465194702, + "mean_norm/layer12": 12.2235426902771, + "mean_norm/layer13": 11.16000908613205, + "mean_norm/layer14": 11.602903127670288, + "mean_norm/layer15": 12.019250571727753, + "mean_norm/layer16": 11.234025776386261, + "mean_norm/layer17": 11.783994853496552, + "mean_norm/layer18": 11.228349685668945, + "mean_norm/layer19": 11.299010992050171, + "mean_norm/layer2": 9.093325853347778, + "mean_norm/layer20": 11.406367242336273, + "mean_norm/layer21": 11.370973885059357, + "mean_norm/layer22": 12.54227989912033, + "mean_norm/layer23": 12.49396014213562, + "mean_norm/layer3": 11.995252788066864, + "mean_norm/layer4": 10.513902842998505, + "mean_norm/layer5": 13.440637111663818, + "mean_norm/layer6": 9.922372043132782, + "mean_norm/layer7": 10.55189323425293, + "mean_norm/layer8": 11.13077861070633, + "mean_norm/layer9": 11.043449401855469, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 12800 + }, + { + "epoch": 5.34, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4677601878779767, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7198004722595215, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6292, + "eval_samples_per_second": 20.724, + "eval_steps_per_second": 0.688, + "step": 12800 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.37, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.3925, + "max_norm": 40.42647933959961, + "max_norm/layer0": 30.862247467041016, + "max_norm/layer1": 32.58104705810547, + "max_norm/layer10": 34.42935562133789, + "max_norm/layer11": 31.688074111938477, + "max_norm/layer12": 36.43111038208008, + "max_norm/layer13": 31.962995529174805, + "max_norm/layer14": 33.105018615722656, + "max_norm/layer15": 40.07574462890625, + "max_norm/layer16": 33.029239654541016, + "max_norm/layer17": 40.42647933959961, + "max_norm/layer18": 34.93319320678711, + "max_norm/layer19": 34.51870346069336, + "max_norm/layer2": 24.97833824157715, + "max_norm/layer20": 34.78074645996094, + "max_norm/layer21": 34.91769790649414, + "max_norm/layer22": 35.466556549072266, + "max_norm/layer23": 33.60380935668945, + "max_norm/layer3": 31.545141220092773, + "max_norm/layer4": 31.3936710357666, + "max_norm/layer5": 39.9000129699707, + "max_norm/layer6": 26.277626037597656, + "max_norm/layer7": 34.1938591003418, + "max_norm/layer8": 33.24137878417969, + "max_norm/layer9": 33.62035369873047, + "mean_norm": 11.371210957566896, + "mean_norm/layer0": 11.163536846637726, + "mean_norm/layer1": 10.814097344875336, + "mean_norm/layer10": 11.146620213985443, + "mean_norm/layer11": 11.529425144195557, + "mean_norm/layer12": 12.236510634422302, + "mean_norm/layer13": 11.1696857213974, + "mean_norm/layer14": 11.61343002319336, + "mean_norm/layer15": 12.031220376491547, + "mean_norm/layer16": 11.243366599082947, + "mean_norm/layer17": 11.79428768157959, + "mean_norm/layer18": 11.236949563026428, + "mean_norm/layer19": 11.307882249355316, + "mean_norm/layer2": 9.097050428390503, + "mean_norm/layer20": 11.415169477462769, + "mean_norm/layer21": 11.379999816417694, + "mean_norm/layer22": 12.554370284080505, + "mean_norm/layer23": 12.506138384342194, + "mean_norm/layer3": 12.008520364761353, + "mean_norm/layer4": 10.52201795578003, + "mean_norm/layer5": 13.457939386367798, + "mean_norm/layer6": 9.928470611572266, + "mean_norm/layer7": 10.559760689735413, + "mean_norm/layer8": 11.140100836753845, + "mean_norm/layer9": 11.052512347698212, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 12850 + }, + { + "epoch": 5.37, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46929744507043397, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.721813440322876, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 10.8261, + "eval_samples_per_second": 22.261, + "eval_steps_per_second": 0.739, + "step": 12850 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.39, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4, + "max_norm": 40.53966522216797, + "max_norm/layer0": 30.93181610107422, + "max_norm/layer1": 32.67628479003906, + "max_norm/layer10": 34.52503204345703, + "max_norm/layer11": 31.753511428833008, + "max_norm/layer12": 36.52308654785156, + "max_norm/layer13": 32.05752944946289, + "max_norm/layer14": 33.178993225097656, + "max_norm/layer15": 40.18899917602539, + "max_norm/layer16": 33.12994384765625, + "max_norm/layer17": 40.53966522216797, + "max_norm/layer18": 35.019256591796875, + "max_norm/layer19": 34.60889434814453, + "max_norm/layer2": 25.012950897216797, + "max_norm/layer20": 34.865150451660156, + "max_norm/layer21": 34.9974479675293, + "max_norm/layer22": 35.567359924316406, + "max_norm/layer23": 33.68381881713867, + "max_norm/layer3": 31.623594284057617, + "max_norm/layer4": 31.476152420043945, + "max_norm/layer5": 39.99509811401367, + "max_norm/layer6": 26.33111000061035, + "max_norm/layer7": 34.27658462524414, + "max_norm/layer8": 33.315608978271484, + "max_norm/layer9": 33.71103286743164, + "mean_norm": 11.38135044525067, + "mean_norm/layer0": 11.177644968032837, + "mean_norm/layer1": 10.823881030082703, + "mean_norm/layer10": 11.155748844146729, + "mean_norm/layer11": 11.539595305919647, + "mean_norm/layer12": 12.249578356742859, + "mean_norm/layer13": 11.179333209991455, + "mean_norm/layer14": 11.62400072813034, + "mean_norm/layer15": 12.043241918087006, + "mean_norm/layer16": 11.252710223197937, + "mean_norm/layer17": 11.804608881473541, + "mean_norm/layer18": 11.245511174201965, + "mean_norm/layer19": 11.3168506026268, + "mean_norm/layer2": 9.100809633731842, + "mean_norm/layer20": 11.424018442630768, + "mean_norm/layer21": 11.388995170593262, + "mean_norm/layer22": 12.56649899482727, + "mean_norm/layer23": 12.51846170425415, + "mean_norm/layer3": 12.021824836730957, + "mean_norm/layer4": 10.53019380569458, + "mean_norm/layer5": 13.475353181362152, + "mean_norm/layer6": 9.934614837169647, + "mean_norm/layer7": 10.567758977413177, + "mean_norm/layer8": 11.149481892585754, + "mean_norm/layer9": 11.061693966388702, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 12900 + }, + { + "epoch": 5.39, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4691068089542189, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.717646837234497, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6585, + "eval_samples_per_second": 20.672, + "eval_steps_per_second": 0.686, + "step": 12900 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.41, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.3993, + "max_norm": 40.673301696777344, + "max_norm/layer0": 30.998746871948242, + "max_norm/layer1": 32.77350616455078, + "max_norm/layer10": 34.62392807006836, + "max_norm/layer11": 31.82044219970703, + "max_norm/layer12": 36.621395111083984, + "max_norm/layer13": 32.15480041503906, + "max_norm/layer14": 33.264678955078125, + "max_norm/layer15": 40.30952453613281, + "max_norm/layer16": 33.21421813964844, + "max_norm/layer17": 40.673301696777344, + "max_norm/layer18": 35.126922607421875, + "max_norm/layer19": 34.703487396240234, + "max_norm/layer2": 25.046913146972656, + "max_norm/layer20": 34.96284484863281, + "max_norm/layer21": 35.083953857421875, + "max_norm/layer22": 35.669921875, + "max_norm/layer23": 33.7749137878418, + "max_norm/layer3": 31.69327163696289, + "max_norm/layer4": 31.55188751220703, + "max_norm/layer5": 40.09039306640625, + "max_norm/layer6": 26.382938385009766, + "max_norm/layer7": 34.37516784667969, + "max_norm/layer8": 33.3942985534668, + "max_norm/layer9": 33.79991149902344, + "mean_norm": 11.391558771332106, + "mean_norm/layer0": 11.191831350326538, + "mean_norm/layer1": 10.833774149417877, + "mean_norm/layer10": 11.165005505084991, + "mean_norm/layer11": 11.549969255924225, + "mean_norm/layer12": 12.262792706489563, + "mean_norm/layer13": 11.189042687416077, + "mean_norm/layer14": 11.634574472904205, + "mean_norm/layer15": 12.05532854795456, + "mean_norm/layer16": 11.26214224100113, + "mean_norm/layer17": 11.81501454114914, + "mean_norm/layer18": 11.254182398319244, + "mean_norm/layer19": 11.325855612754822, + "mean_norm/layer2": 9.104621648788452, + "mean_norm/layer20": 11.432913839817047, + "mean_norm/layer21": 11.398003339767456, + "mean_norm/layer22": 12.578662037849426, + "mean_norm/layer23": 12.530750453472137, + "mean_norm/layer3": 12.035245954990387, + "mean_norm/layer4": 10.538455426692963, + "mean_norm/layer5": 13.492934942245483, + "mean_norm/layer6": 9.94073635339737, + "mean_norm/layer7": 10.575691282749176, + "mean_norm/layer8": 11.15895789861679, + "mean_norm/layer9": 11.070923864841461, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 12950 + }, + { + "epoch": 5.41, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4688512754367392, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.718743324279785, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8444, + "eval_samples_per_second": 20.347, + "eval_steps_per_second": 0.675, + "step": 12950 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.43, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4133, + "max_norm": 40.796546936035156, + "max_norm/layer0": 31.071434020996094, + "max_norm/layer1": 32.860477447509766, + "max_norm/layer10": 34.711509704589844, + "max_norm/layer11": 31.88778305053711, + "max_norm/layer12": 36.72361755371094, + "max_norm/layer13": 32.25141525268555, + "max_norm/layer14": 33.352420806884766, + "max_norm/layer15": 40.42947769165039, + "max_norm/layer16": 33.28781509399414, + "max_norm/layer17": 40.796546936035156, + "max_norm/layer18": 35.232322692871094, + "max_norm/layer19": 34.80649185180664, + "max_norm/layer2": 25.087366104125977, + "max_norm/layer20": 35.050086975097656, + "max_norm/layer21": 35.175132751464844, + "max_norm/layer22": 35.75883865356445, + "max_norm/layer23": 33.876068115234375, + "max_norm/layer3": 31.762784957885742, + "max_norm/layer4": 31.617982864379883, + "max_norm/layer5": 40.18153762817383, + "max_norm/layer6": 26.44247055053711, + "max_norm/layer7": 34.473243713378906, + "max_norm/layer8": 33.4754638671875, + "max_norm/layer9": 33.89864730834961, + "mean_norm": 11.40168750534455, + "mean_norm/layer0": 11.205902516841888, + "mean_norm/layer1": 10.84367960691452, + "mean_norm/layer10": 11.174164533615112, + "mean_norm/layer11": 11.560200273990631, + "mean_norm/layer12": 12.275927484035492, + "mean_norm/layer13": 11.198736369609833, + "mean_norm/layer14": 11.64512050151825, + "mean_norm/layer15": 12.067360758781433, + "mean_norm/layer16": 11.271453142166138, + "mean_norm/layer17": 11.825299143791199, + "mean_norm/layer18": 11.262673079967499, + "mean_norm/layer19": 11.33467322587967, + "mean_norm/layer2": 9.108363032341003, + "mean_norm/layer20": 11.441703617572784, + "mean_norm/layer21": 11.406952321529388, + "mean_norm/layer22": 12.590731382369995, + "mean_norm/layer23": 12.543003857135773, + "mean_norm/layer3": 12.048669159412384, + "mean_norm/layer4": 10.546570122241974, + "mean_norm/layer5": 13.510445177555084, + "mean_norm/layer6": 9.946801245212555, + "mean_norm/layer7": 10.583557188510895, + "mean_norm/layer8": 11.168345034122467, + "mean_norm/layer9": 11.080167353153229, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 13000 + }, + { + "epoch": 5.43, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4694231837853843, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.722926616668701, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6383, + "eval_samples_per_second": 20.707, + "eval_steps_per_second": 0.687, + "step": 13000 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.45, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4043, + "max_norm": 40.9404296875, + "max_norm/layer0": 31.16077423095703, + "max_norm/layer1": 32.95548629760742, + "max_norm/layer10": 34.809906005859375, + "max_norm/layer11": 31.963796615600586, + "max_norm/layer12": 36.830169677734375, + "max_norm/layer13": 32.35176467895508, + "max_norm/layer14": 33.43437194824219, + "max_norm/layer15": 40.522647857666016, + "max_norm/layer16": 33.36571502685547, + "max_norm/layer17": 40.9404296875, + "max_norm/layer18": 35.327171325683594, + "max_norm/layer19": 34.913414001464844, + "max_norm/layer2": 25.136255264282227, + "max_norm/layer20": 35.13398742675781, + "max_norm/layer21": 35.26042938232422, + "max_norm/layer22": 35.85120391845703, + "max_norm/layer23": 33.953338623046875, + "max_norm/layer3": 31.837873458862305, + "max_norm/layer4": 31.689170837402344, + "max_norm/layer5": 40.275970458984375, + "max_norm/layer6": 26.50471305847168, + "max_norm/layer7": 34.56406021118164, + "max_norm/layer8": 33.55378723144531, + "max_norm/layer9": 33.99280548095703, + "mean_norm": 11.41187767436107, + "mean_norm/layer0": 11.22002124786377, + "mean_norm/layer1": 10.853593170642853, + "mean_norm/layer10": 11.183394372463226, + "mean_norm/layer11": 11.570508360862732, + "mean_norm/layer12": 12.289067327976227, + "mean_norm/layer13": 11.208430171012878, + "mean_norm/layer14": 11.65568321943283, + "mean_norm/layer15": 12.07946515083313, + "mean_norm/layer16": 11.280861020088196, + "mean_norm/layer17": 11.835736393928528, + "mean_norm/layer18": 11.271266996860504, + "mean_norm/layer19": 11.343626499176025, + "mean_norm/layer2": 9.112095832824707, + "mean_norm/layer20": 11.450542509555817, + "mean_norm/layer21": 11.416008174419403, + "mean_norm/layer22": 12.602880716323853, + "mean_norm/layer23": 12.555341303348541, + "mean_norm/layer3": 12.062138319015503, + "mean_norm/layer4": 10.554663360118866, + "mean_norm/layer5": 13.528029143810272, + "mean_norm/layer6": 9.952929139137268, + "mean_norm/layer7": 10.591509401798248, + "mean_norm/layer8": 11.177850186824799, + "mean_norm/layer9": 11.089422166347504, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 13050 + }, + { + "epoch": 5.45, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4680278896581935, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7215194702148438, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6317, + "eval_samples_per_second": 20.719, + "eval_steps_per_second": 0.688, + "step": 13050 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.47, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4184, + "max_norm": 41.073753356933594, + "max_norm/layer0": 31.25911521911621, + "max_norm/layer1": 33.047813415527344, + "max_norm/layer10": 34.90483856201172, + "max_norm/layer11": 32.04907989501953, + "max_norm/layer12": 36.92471694946289, + "max_norm/layer13": 32.446258544921875, + "max_norm/layer14": 33.51337432861328, + "max_norm/layer15": 40.64415740966797, + "max_norm/layer16": 33.44923400878906, + "max_norm/layer17": 41.073753356933594, + "max_norm/layer18": 35.43497848510742, + "max_norm/layer19": 35.00997543334961, + "max_norm/layer2": 25.17824935913086, + "max_norm/layer20": 35.21885299682617, + "max_norm/layer21": 35.36158752441406, + "max_norm/layer22": 35.92625045776367, + "max_norm/layer23": 34.03020095825195, + "max_norm/layer3": 31.913679122924805, + "max_norm/layer4": 31.755531311035156, + "max_norm/layer5": 40.36668014526367, + "max_norm/layer6": 26.55792999267578, + "max_norm/layer7": 34.648197174072266, + "max_norm/layer8": 33.62436294555664, + "max_norm/layer9": 34.08570098876953, + "mean_norm": 11.421943314373493, + "mean_norm/layer0": 11.233939230442047, + "mean_norm/layer1": 10.863298058509827, + "mean_norm/layer10": 11.192550837993622, + "mean_norm/layer11": 11.580713331699371, + "mean_norm/layer12": 12.302023231983185, + "mean_norm/layer13": 11.218043863773346, + "mean_norm/layer14": 11.666103959083557, + "mean_norm/layer15": 12.091457724571228, + "mean_norm/layer16": 11.29023402929306, + "mean_norm/layer17": 11.846083104610443, + "mean_norm/layer18": 11.27977341413498, + "mean_norm/layer19": 11.352494895458221, + "mean_norm/layer2": 9.115803480148315, + "mean_norm/layer20": 11.45926821231842, + "mean_norm/layer21": 11.42496120929718, + "mean_norm/layer22": 12.614860355854034, + "mean_norm/layer23": 12.567517876625061, + "mean_norm/layer3": 12.075318932533264, + "mean_norm/layer4": 10.562665104866028, + "mean_norm/layer5": 13.545399487018585, + "mean_norm/layer6": 9.9589102268219, + "mean_norm/layer7": 10.599405288696289, + "mean_norm/layer8": 11.187245190143585, + "mean_norm/layer9": 11.098568499088287, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 13100 + }, + { + "epoch": 5.47, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46916359418032555, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7211787700653076, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 10.8252, + "eval_samples_per_second": 22.263, + "eval_steps_per_second": 0.739, + "step": 13100 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.49, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4133, + "max_norm": 41.19325637817383, + "max_norm/layer0": 31.352529525756836, + "max_norm/layer1": 33.13313293457031, + "max_norm/layer10": 34.997493743896484, + "max_norm/layer11": 32.13360595703125, + "max_norm/layer12": 37.020450592041016, + "max_norm/layer13": 32.550804138183594, + "max_norm/layer14": 33.60025405883789, + "max_norm/layer15": 40.751651763916016, + "max_norm/layer16": 33.52793884277344, + "max_norm/layer17": 41.19325637817383, + "max_norm/layer18": 35.55864715576172, + "max_norm/layer19": 35.10562515258789, + "max_norm/layer2": 25.227224349975586, + "max_norm/layer20": 35.30140686035156, + "max_norm/layer21": 35.45964431762695, + "max_norm/layer22": 36.017539978027344, + "max_norm/layer23": 34.118995666503906, + "max_norm/layer3": 31.98078155517578, + "max_norm/layer4": 31.82782554626465, + "max_norm/layer5": 40.46044921875, + "max_norm/layer6": 26.614765167236328, + "max_norm/layer7": 34.73370361328125, + "max_norm/layer8": 33.699100494384766, + "max_norm/layer9": 34.17997741699219, + "mean_norm": 11.43214280406634, + "mean_norm/layer0": 11.247965574264526, + "mean_norm/layer1": 10.873225510120392, + "mean_norm/layer10": 11.20186734199524, + "mean_norm/layer11": 11.591102659702301, + "mean_norm/layer12": 12.315137565135956, + "mean_norm/layer13": 11.227831721305847, + "mean_norm/layer14": 11.676612555980682, + "mean_norm/layer15": 12.103615701198578, + "mean_norm/layer16": 11.29973292350769, + "mean_norm/layer17": 11.856513440608978, + "mean_norm/layer18": 11.288440763950348, + "mean_norm/layer19": 11.361487448215485, + "mean_norm/layer2": 9.11957997083664, + "mean_norm/layer20": 11.468166828155518, + "mean_norm/layer21": 11.433948516845703, + "mean_norm/layer22": 12.62698209285736, + "mean_norm/layer23": 12.579815804958344, + "mean_norm/layer3": 12.088749766349792, + "mean_norm/layer4": 10.570803761482239, + "mean_norm/layer5": 13.562963128089905, + "mean_norm/layer6": 9.965040504932404, + "mean_norm/layer7": 10.607343137264252, + "mean_norm/layer8": 11.196721315383911, + "mean_norm/layer9": 11.107779264450073, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 13150 + }, + { + "epoch": 5.49, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4688472193491602, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7161834239959717, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8658, + "eval_samples_per_second": 20.31, + "eval_steps_per_second": 0.674, + "step": 13150 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.51, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.412, + "max_norm": 41.33484649658203, + "max_norm/layer0": 31.432945251464844, + "max_norm/layer1": 33.227447509765625, + "max_norm/layer10": 35.095306396484375, + "max_norm/layer11": 32.22079849243164, + "max_norm/layer12": 37.126129150390625, + "max_norm/layer13": 32.637577056884766, + "max_norm/layer14": 33.67879104614258, + "max_norm/layer15": 40.858245849609375, + "max_norm/layer16": 33.607337951660156, + "max_norm/layer17": 41.33484649658203, + "max_norm/layer18": 35.682640075683594, + "max_norm/layer19": 35.209678649902344, + "max_norm/layer2": 25.263656616210938, + "max_norm/layer20": 35.401668548583984, + "max_norm/layer21": 35.54304885864258, + "max_norm/layer22": 36.10606384277344, + "max_norm/layer23": 34.20365524291992, + "max_norm/layer3": 32.0433349609375, + "max_norm/layer4": 31.899898529052734, + "max_norm/layer5": 40.55813980102539, + "max_norm/layer6": 26.6668643951416, + "max_norm/layer7": 34.81508255004883, + "max_norm/layer8": 33.77111053466797, + "max_norm/layer9": 34.279014587402344, + "mean_norm": 11.442247187097868, + "mean_norm/layer0": 11.261785089969635, + "mean_norm/layer1": 10.883079826831818, + "mean_norm/layer10": 11.210987150669098, + "mean_norm/layer11": 11.601315975189209, + "mean_norm/layer12": 12.32822459936142, + "mean_norm/layer13": 11.237483143806458, + "mean_norm/layer14": 11.68710470199585, + "mean_norm/layer15": 12.11562329530716, + "mean_norm/layer16": 11.309135794639587, + "mean_norm/layer17": 11.86676573753357, + "mean_norm/layer18": 11.296909749507904, + "mean_norm/layer19": 11.37040263414383, + "mean_norm/layer2": 9.123386025428772, + "mean_norm/layer20": 11.477011442184448, + "mean_norm/layer21": 11.442870557308197, + "mean_norm/layer22": 12.638907492160797, + "mean_norm/layer23": 12.591942846775055, + "mean_norm/layer3": 12.102109968662262, + "mean_norm/layer4": 10.578868985176086, + "mean_norm/layer5": 13.58046168088913, + "mean_norm/layer6": 9.971136212348938, + "mean_norm/layer7": 10.61527305841446, + "mean_norm/layer8": 11.206160426139832, + "mean_norm/layer9": 11.116986095905304, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 13200 + }, + { + "epoch": 5.51, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46872959280936793, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.717339515686035, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8507, + "eval_samples_per_second": 20.336, + "eval_steps_per_second": 0.675, + "step": 13200 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.53, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4223, + "max_norm": 41.460872650146484, + "max_norm/layer0": 31.52048110961914, + "max_norm/layer1": 33.32143020629883, + "max_norm/layer10": 35.188270568847656, + "max_norm/layer11": 32.29136657714844, + "max_norm/layer12": 37.231136322021484, + "max_norm/layer13": 32.73362350463867, + "max_norm/layer14": 33.75789260864258, + "max_norm/layer15": 40.970985412597656, + "max_norm/layer16": 33.6841926574707, + "max_norm/layer17": 41.460872650146484, + "max_norm/layer18": 35.798545837402344, + "max_norm/layer19": 35.29481506347656, + "max_norm/layer2": 25.29656219482422, + "max_norm/layer20": 35.4903450012207, + "max_norm/layer21": 35.632667541503906, + "max_norm/layer22": 36.19403839111328, + "max_norm/layer23": 34.284523010253906, + "max_norm/layer3": 32.09943771362305, + "max_norm/layer4": 31.967790603637695, + "max_norm/layer5": 40.65348434448242, + "max_norm/layer6": 26.707876205444336, + "max_norm/layer7": 34.904991149902344, + "max_norm/layer8": 33.850345611572266, + "max_norm/layer9": 34.3624267578125, + "mean_norm": 11.452307460208734, + "mean_norm/layer0": 11.275518834590912, + "mean_norm/layer1": 10.892802596092224, + "mean_norm/layer10": 11.22011786699295, + "mean_norm/layer11": 11.611432790756226, + "mean_norm/layer12": 12.341229736804962, + "mean_norm/layer13": 11.247182369232178, + "mean_norm/layer14": 11.697576940059662, + "mean_norm/layer15": 12.127613306045532, + "mean_norm/layer16": 11.318461954593658, + "mean_norm/layer17": 11.877028286457062, + "mean_norm/layer18": 11.305418491363525, + "mean_norm/layer19": 11.379250943660736, + "mean_norm/layer2": 9.127110540866852, + "mean_norm/layer20": 11.485674262046814, + "mean_norm/layer21": 11.451743423938751, + "mean_norm/layer22": 12.650978088378906, + "mean_norm/layer23": 12.604095160961151, + "mean_norm/layer3": 12.115413546562195, + "mean_norm/layer4": 10.586904525756836, + "mean_norm/layer5": 13.59795880317688, + "mean_norm/layer6": 9.977186620235443, + "mean_norm/layer7": 10.623132765293121, + "mean_norm/layer8": 11.215501189231873, + "mean_norm/layer9": 11.126046001911163, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 13250 + }, + { + "epoch": 5.53, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4688958924001087, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7104713916778564, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6498, + "eval_samples_per_second": 20.687, + "eval_steps_per_second": 0.687, + "step": 13250 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.55, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4168, + "max_norm": 41.58987808227539, + "max_norm/layer0": 31.605928421020508, + "max_norm/layer1": 33.41110610961914, + "max_norm/layer10": 35.28288650512695, + "max_norm/layer11": 32.35896682739258, + "max_norm/layer12": 37.328975677490234, + "max_norm/layer13": 32.81481170654297, + "max_norm/layer14": 33.8287353515625, + "max_norm/layer15": 41.096561431884766, + "max_norm/layer16": 33.78337860107422, + "max_norm/layer17": 41.58987808227539, + "max_norm/layer18": 35.9139289855957, + "max_norm/layer19": 35.399471282958984, + "max_norm/layer2": 25.34184455871582, + "max_norm/layer20": 35.5942497253418, + "max_norm/layer21": 35.72600173950195, + "max_norm/layer22": 36.28502655029297, + "max_norm/layer23": 34.368873596191406, + "max_norm/layer3": 32.15465545654297, + "max_norm/layer4": 32.03687286376953, + "max_norm/layer5": 40.74073791503906, + "max_norm/layer6": 26.754438400268555, + "max_norm/layer7": 34.99358367919922, + "max_norm/layer8": 33.9345703125, + "max_norm/layer9": 34.452205657958984, + "mean_norm": 11.462326402465502, + "mean_norm/layer0": 11.28924685716629, + "mean_norm/layer1": 10.902493834495544, + "mean_norm/layer10": 11.229179680347443, + "mean_norm/layer11": 11.621479094028473, + "mean_norm/layer12": 12.354156792163849, + "mean_norm/layer13": 11.256803750991821, + "mean_norm/layer14": 11.707986295223236, + "mean_norm/layer15": 12.139529526233673, + "mean_norm/layer16": 11.327766597270966, + "mean_norm/layer17": 11.887259781360626, + "mean_norm/layer18": 11.313856422901154, + "mean_norm/layer19": 11.38800984621048, + "mean_norm/layer2": 9.13087511062622, + "mean_norm/layer20": 11.49438589811325, + "mean_norm/layer21": 11.460516810417175, + "mean_norm/layer22": 12.663020372390747, + "mean_norm/layer23": 12.616227269172668, + "mean_norm/layer3": 12.128678977489471, + "mean_norm/layer4": 10.594914734363556, + "mean_norm/layer5": 13.615288376808167, + "mean_norm/layer6": 9.983207881450653, + "mean_norm/layer7": 10.631061017513275, + "mean_norm/layer8": 11.224867701530457, + "mean_norm/layer9": 11.135021030902863, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 13300 + }, + { + "epoch": 5.55, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46990991429486945, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7142724990844727, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6426, + "eval_samples_per_second": 20.7, + "eval_steps_per_second": 0.687, + "step": 13300 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.57, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4235, + "max_norm": 41.713775634765625, + "max_norm/layer0": 31.692907333374023, + "max_norm/layer1": 33.50731658935547, + "max_norm/layer10": 35.388431549072266, + "max_norm/layer11": 32.41889190673828, + "max_norm/layer12": 37.428932189941406, + "max_norm/layer13": 32.89790344238281, + "max_norm/layer14": 33.91184997558594, + "max_norm/layer15": 41.21902847290039, + "max_norm/layer16": 33.867496490478516, + "max_norm/layer17": 41.713775634765625, + "max_norm/layer18": 36.05093765258789, + "max_norm/layer19": 35.49272155761719, + "max_norm/layer2": 25.380748748779297, + "max_norm/layer20": 35.684383392333984, + "max_norm/layer21": 35.81870651245117, + "max_norm/layer22": 36.37220764160156, + "max_norm/layer23": 34.44894027709961, + "max_norm/layer3": 32.21410369873047, + "max_norm/layer4": 32.11796569824219, + "max_norm/layer5": 40.8372802734375, + "max_norm/layer6": 26.808568954467773, + "max_norm/layer7": 35.08625793457031, + "max_norm/layer8": 34.01543426513672, + "max_norm/layer9": 34.54030227661133, + "mean_norm": 11.472280822694302, + "mean_norm/layer0": 11.302962839603424, + "mean_norm/layer1": 10.912257492542267, + "mean_norm/layer10": 11.238200902938843, + "mean_norm/layer11": 11.631586790084839, + "mean_norm/layer12": 12.366995334625244, + "mean_norm/layer13": 11.266227841377258, + "mean_norm/layer14": 11.718317866325378, + "mean_norm/layer15": 12.151341676712036, + "mean_norm/layer16": 11.337043285369873, + "mean_norm/layer17": 11.89738005399704, + "mean_norm/layer18": 11.322262048721313, + "mean_norm/layer19": 11.39665973186493, + "mean_norm/layer2": 9.134590566158295, + "mean_norm/layer20": 11.503011286258698, + "mean_norm/layer21": 11.469366490840912, + "mean_norm/layer22": 12.674902260303497, + "mean_norm/layer23": 12.628194808959961, + "mean_norm/layer3": 12.14181238412857, + "mean_norm/layer4": 10.602854549884796, + "mean_norm/layer5": 13.632572889328003, + "mean_norm/layer6": 9.989143371582031, + "mean_norm/layer7": 10.638879597187042, + "mean_norm/layer8": 11.23413860797882, + "mean_norm/layer9": 11.144037067890167, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 13350 + }, + { + "epoch": 5.57, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46916359418032555, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.714078426361084, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8326, + "eval_samples_per_second": 20.367, + "eval_steps_per_second": 0.676, + "step": 13350 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.59, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4219, + "max_norm": 41.837982177734375, + "max_norm/layer0": 31.79075813293457, + "max_norm/layer1": 33.60240936279297, + "max_norm/layer10": 35.48202896118164, + "max_norm/layer11": 32.483062744140625, + "max_norm/layer12": 37.52994155883789, + "max_norm/layer13": 32.990882873535156, + "max_norm/layer14": 33.9993782043457, + "max_norm/layer15": 41.33662414550781, + "max_norm/layer16": 33.95119094848633, + "max_norm/layer17": 41.837982177734375, + "max_norm/layer18": 36.17069625854492, + "max_norm/layer19": 35.598567962646484, + "max_norm/layer2": 25.41947364807129, + "max_norm/layer20": 35.76862716674805, + "max_norm/layer21": 35.891048431396484, + "max_norm/layer22": 36.46067810058594, + "max_norm/layer23": 34.52641296386719, + "max_norm/layer3": 32.27833938598633, + "max_norm/layer4": 32.184410095214844, + "max_norm/layer5": 40.935646057128906, + "max_norm/layer6": 26.854347229003906, + "max_norm/layer7": 35.179630279541016, + "max_norm/layer8": 34.0980110168457, + "max_norm/layer9": 34.62184143066406, + "mean_norm": 11.482310282687346, + "mean_norm/layer0": 11.316719889640808, + "mean_norm/layer1": 10.922053396701813, + "mean_norm/layer10": 11.247276484966278, + "mean_norm/layer11": 11.64177393913269, + "mean_norm/layer12": 12.379945814609528, + "mean_norm/layer13": 11.275794327259064, + "mean_norm/layer14": 11.72872668504715, + "mean_norm/layer15": 12.163222134113312, + "mean_norm/layer16": 11.346361517906189, + "mean_norm/layer17": 11.907587885856628, + "mean_norm/layer18": 11.330709755420685, + "mean_norm/layer19": 11.40546178817749, + "mean_norm/layer2": 9.138280272483826, + "mean_norm/layer20": 11.511772215366364, + "mean_norm/layer21": 11.478142619132996, + "mean_norm/layer22": 12.686840951442719, + "mean_norm/layer23": 12.640309393405914, + "mean_norm/layer3": 12.155011892318726, + "mean_norm/layer4": 10.610854387283325, + "mean_norm/layer5": 13.649908483028412, + "mean_norm/layer6": 9.995129764080048, + "mean_norm/layer7": 10.6467826962471, + "mean_norm/layer8": 11.243535876274109, + "mean_norm/layer9": 11.153244614601135, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 13400 + }, + { + "epoch": 5.59, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46905813590327045, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.711637496948242, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6452, + "eval_samples_per_second": 20.695, + "eval_steps_per_second": 0.687, + "step": 13400 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.62, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4137, + "max_norm": 41.95629119873047, + "max_norm/layer0": 31.894800186157227, + "max_norm/layer1": 33.70528793334961, + "max_norm/layer10": 35.5774040222168, + "max_norm/layer11": 32.56145095825195, + "max_norm/layer12": 37.62503433227539, + "max_norm/layer13": 33.0743408203125, + "max_norm/layer14": 34.08401107788086, + "max_norm/layer15": 41.45420455932617, + "max_norm/layer16": 34.023075103759766, + "max_norm/layer17": 41.95629119873047, + "max_norm/layer18": 36.291751861572266, + "max_norm/layer19": 35.699798583984375, + "max_norm/layer2": 25.462074279785156, + "max_norm/layer20": 35.848453521728516, + "max_norm/layer21": 35.9924430847168, + "max_norm/layer22": 36.55889892578125, + "max_norm/layer23": 34.61848449707031, + "max_norm/layer3": 32.35057830810547, + "max_norm/layer4": 32.256893157958984, + "max_norm/layer5": 41.03318786621094, + "max_norm/layer6": 26.913339614868164, + "max_norm/layer7": 35.26021957397461, + "max_norm/layer8": 34.18633270263672, + "max_norm/layer9": 34.706512451171875, + "mean_norm": 11.492379434406757, + "mean_norm/layer0": 11.330553650856018, + "mean_norm/layer1": 10.931818127632141, + "mean_norm/layer10": 11.256403625011444, + "mean_norm/layer11": 11.652017891407013, + "mean_norm/layer12": 12.392934620380402, + "mean_norm/layer13": 11.2853382229805, + "mean_norm/layer14": 11.739181399345398, + "mean_norm/layer15": 12.175087809562683, + "mean_norm/layer16": 11.355721652507782, + "mean_norm/layer17": 11.917894303798676, + "mean_norm/layer18": 11.339221060276031, + "mean_norm/layer19": 11.414319634437561, + "mean_norm/layer2": 9.14203691482544, + "mean_norm/layer20": 11.520379364490509, + "mean_norm/layer21": 11.487022876739502, + "mean_norm/layer22": 12.698857307434082, + "mean_norm/layer23": 12.652542471885681, + "mean_norm/layer3": 12.168289422988892, + "mean_norm/layer4": 10.618834555149078, + "mean_norm/layer5": 13.667337656021118, + "mean_norm/layer6": 10.001234710216522, + "mean_norm/layer7": 10.654753506183624, + "mean_norm/layer8": 11.252941370010376, + "mean_norm/layer9": 11.162384271621704, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 13450 + }, + { + "epoch": 5.62, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4691311454796932, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.709066390991211, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6434, + "eval_samples_per_second": 20.698, + "eval_steps_per_second": 0.687, + "step": 13450 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.64, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4237, + "max_norm": 42.06662368774414, + "max_norm/layer0": 31.995527267456055, + "max_norm/layer1": 33.81433868408203, + "max_norm/layer10": 35.674861907958984, + "max_norm/layer11": 32.633907318115234, + "max_norm/layer12": 37.72537612915039, + "max_norm/layer13": 33.15221405029297, + "max_norm/layer14": 34.16411590576172, + "max_norm/layer15": 41.57180404663086, + "max_norm/layer16": 34.10177993774414, + "max_norm/layer17": 42.06662368774414, + "max_norm/layer18": 36.408756256103516, + "max_norm/layer19": 35.804447174072266, + "max_norm/layer2": 25.517255783081055, + "max_norm/layer20": 35.92195129394531, + "max_norm/layer21": 36.10334777832031, + "max_norm/layer22": 36.6356086730957, + "max_norm/layer23": 34.714378356933594, + "max_norm/layer3": 32.415916442871094, + "max_norm/layer4": 32.33707046508789, + "max_norm/layer5": 41.12393569946289, + "max_norm/layer6": 26.9628849029541, + "max_norm/layer7": 35.34476852416992, + "max_norm/layer8": 34.27030563354492, + "max_norm/layer9": 34.790771484375, + "mean_norm": 11.502338218192259, + "mean_norm/layer0": 11.344147622585297, + "mean_norm/layer1": 10.941574037075043, + "mean_norm/layer10": 11.26539170742035, + "mean_norm/layer11": 11.66208666563034, + "mean_norm/layer12": 12.405764102935791, + "mean_norm/layer13": 11.294852435588837, + "mean_norm/layer14": 11.749512732028961, + "mean_norm/layer15": 12.18685758113861, + "mean_norm/layer16": 11.364993393421173, + "mean_norm/layer17": 11.928065538406372, + "mean_norm/layer18": 11.347671389579773, + "mean_norm/layer19": 11.423152148723602, + "mean_norm/layer2": 9.145713448524475, + "mean_norm/layer20": 11.52916818857193, + "mean_norm/layer21": 11.49576997756958, + "mean_norm/layer22": 12.710700571537018, + "mean_norm/layer23": 12.664546847343445, + "mean_norm/layer3": 12.181446313858032, + "mean_norm/layer4": 10.626774251461029, + "mean_norm/layer5": 13.684615194797516, + "mean_norm/layer6": 10.00717294216156, + "mean_norm/layer7": 10.662572145462036, + "mean_norm/layer8": 11.262239933013916, + "mean_norm/layer9": 11.171328067779541, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 13500 + }, + { + "epoch": 5.64, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4694353520481214, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7050700187683105, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 10.81, + "eval_samples_per_second": 22.294, + "eval_steps_per_second": 0.74, + "step": 13500 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.66, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4288, + "max_norm": 42.18446350097656, + "max_norm/layer0": 32.09495162963867, + "max_norm/layer1": 33.92106246948242, + "max_norm/layer10": 35.778926849365234, + "max_norm/layer11": 32.708717346191406, + "max_norm/layer12": 37.83408737182617, + "max_norm/layer13": 33.22709274291992, + "max_norm/layer14": 34.2531852722168, + "max_norm/layer15": 41.674163818359375, + "max_norm/layer16": 34.1853141784668, + "max_norm/layer17": 42.18446350097656, + "max_norm/layer18": 36.49985885620117, + "max_norm/layer19": 35.90671157836914, + "max_norm/layer2": 25.565250396728516, + "max_norm/layer20": 36.003273010253906, + "max_norm/layer21": 36.20390319824219, + "max_norm/layer22": 36.71393585205078, + "max_norm/layer23": 34.7982292175293, + "max_norm/layer3": 32.48151397705078, + "max_norm/layer4": 32.41646194458008, + "max_norm/layer5": 41.22113800048828, + "max_norm/layer6": 27.021968841552734, + "max_norm/layer7": 35.427452087402344, + "max_norm/layer8": 34.34320068359375, + "max_norm/layer9": 34.87732696533203, + "mean_norm": 11.512315717836222, + "mean_norm/layer0": 11.357698917388916, + "mean_norm/layer1": 10.951256394386292, + "mean_norm/layer10": 11.274416208267212, + "mean_norm/layer11": 11.672086000442505, + "mean_norm/layer12": 12.41863089799881, + "mean_norm/layer13": 11.30438607931137, + "mean_norm/layer14": 11.759986698627472, + "mean_norm/layer15": 12.198642432689667, + "mean_norm/layer16": 11.374230086803436, + "mean_norm/layer17": 11.938192427158356, + "mean_norm/layer18": 11.356159150600433, + "mean_norm/layer19": 11.432008922100067, + "mean_norm/layer2": 9.14939570426941, + "mean_norm/layer20": 11.537839412689209, + "mean_norm/layer21": 11.504580557346344, + "mean_norm/layer22": 12.722698092460632, + "mean_norm/layer23": 12.676586389541626, + "mean_norm/layer3": 12.194705128669739, + "mean_norm/layer4": 10.634714663028717, + "mean_norm/layer5": 13.701936960220337, + "mean_norm/layer6": 10.013112783432007, + "mean_norm/layer7": 10.670415759086609, + "mean_norm/layer8": 11.271536707878113, + "mean_norm/layer9": 11.180360853672028, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 13550 + }, + { + "epoch": 5.66, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46922037940643213, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7097346782684326, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.847, + "eval_samples_per_second": 20.343, + "eval_steps_per_second": 0.675, + "step": 13550 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.68, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.417, + "max_norm": 42.29948043823242, + "max_norm/layer0": 32.19629669189453, + "max_norm/layer1": 34.0298957824707, + "max_norm/layer10": 35.873329162597656, + "max_norm/layer11": 32.782554626464844, + "max_norm/layer12": 37.94023895263672, + "max_norm/layer13": 33.30521011352539, + "max_norm/layer14": 34.3357048034668, + "max_norm/layer15": 41.79225540161133, + "max_norm/layer16": 34.278114318847656, + "max_norm/layer17": 42.29948043823242, + "max_norm/layer18": 36.587486267089844, + "max_norm/layer19": 36.01373291015625, + "max_norm/layer2": 25.616296768188477, + "max_norm/layer20": 36.0982780456543, + "max_norm/layer21": 36.2936897277832, + "max_norm/layer22": 36.797672271728516, + "max_norm/layer23": 34.886837005615234, + "max_norm/layer3": 32.53889846801758, + "max_norm/layer4": 32.496707916259766, + "max_norm/layer5": 41.32212448120117, + "max_norm/layer6": 27.078197479248047, + "max_norm/layer7": 35.5162467956543, + "max_norm/layer8": 34.416038513183594, + "max_norm/layer9": 34.968238830566406, + "mean_norm": 11.52224476635456, + "mean_norm/layer0": 11.371230006217957, + "mean_norm/layer1": 10.96083915233612, + "mean_norm/layer10": 11.283371925354004, + "mean_norm/layer11": 11.682111740112305, + "mean_norm/layer12": 12.431476056575775, + "mean_norm/layer13": 11.313903331756592, + "mean_norm/layer14": 11.770337045192719, + "mean_norm/layer15": 12.210534811019897, + "mean_norm/layer16": 11.383462309837341, + "mean_norm/layer17": 11.948289573192596, + "mean_norm/layer18": 11.364611744880676, + "mean_norm/layer19": 11.440718173980713, + "mean_norm/layer2": 9.153079271316528, + "mean_norm/layer20": 11.54639196395874, + "mean_norm/layer21": 11.51335096359253, + "mean_norm/layer22": 12.734551429748535, + "mean_norm/layer23": 12.68855208158493, + "mean_norm/layer3": 12.207791090011597, + "mean_norm/layer4": 10.642626106739044, + "mean_norm/layer5": 13.719220459461212, + "mean_norm/layer6": 10.01904433965683, + "mean_norm/layer7": 10.678197205066681, + "mean_norm/layer8": 11.280803203582764, + "mean_norm/layer9": 11.189380407333374, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 13600 + }, + { + "epoch": 5.68, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4692325476691693, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7084743976593018, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8418, + "eval_samples_per_second": 20.352, + "eval_steps_per_second": 0.676, + "step": 13600 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.7, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4312, + "max_norm": 42.4152717590332, + "max_norm/layer0": 32.290565490722656, + "max_norm/layer1": 34.130165100097656, + "max_norm/layer10": 35.96076202392578, + "max_norm/layer11": 32.853206634521484, + "max_norm/layer12": 38.056854248046875, + "max_norm/layer13": 33.386722564697266, + "max_norm/layer14": 34.417293548583984, + "max_norm/layer15": 41.91092300415039, + "max_norm/layer16": 34.39151382446289, + "max_norm/layer17": 42.4152717590332, + "max_norm/layer18": 36.677120208740234, + "max_norm/layer19": 36.10676956176758, + "max_norm/layer2": 25.653728485107422, + "max_norm/layer20": 36.18156051635742, + "max_norm/layer21": 36.40180969238281, + "max_norm/layer22": 36.877620697021484, + "max_norm/layer23": 34.97404479980469, + "max_norm/layer3": 32.59130096435547, + "max_norm/layer4": 32.57655334472656, + "max_norm/layer5": 41.421573638916016, + "max_norm/layer6": 27.125125885009766, + "max_norm/layer7": 35.60506057739258, + "max_norm/layer8": 34.491661071777344, + "max_norm/layer9": 35.03976821899414, + "mean_norm": 11.532145649194717, + "mean_norm/layer0": 11.38479232788086, + "mean_norm/layer1": 10.970433294773102, + "mean_norm/layer10": 11.292322337627411, + "mean_norm/layer11": 11.692193269729614, + "mean_norm/layer12": 12.444232642650604, + "mean_norm/layer13": 11.323309123516083, + "mean_norm/layer14": 11.780568301677704, + "mean_norm/layer15": 12.2222620844841, + "mean_norm/layer16": 11.392680704593658, + "mean_norm/layer17": 11.958375811576843, + "mean_norm/layer18": 11.373052775859833, + "mean_norm/layer19": 11.449408113956451, + "mean_norm/layer2": 9.156772315502167, + "mean_norm/layer20": 11.555001676082611, + "mean_norm/layer21": 11.522112011909485, + "mean_norm/layer22": 12.746351480484009, + "mean_norm/layer23": 12.700541198253632, + "mean_norm/layer3": 12.220799148082733, + "mean_norm/layer4": 10.650478422641754, + "mean_norm/layer5": 13.736432790756226, + "mean_norm/layer6": 10.024990856647491, + "mean_norm/layer7": 10.685915529727936, + "mean_norm/layer8": 11.290149748325348, + "mean_norm/layer9": 11.198319613933563, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 13650 + }, + { + "epoch": 5.7, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4698977460321323, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.709822177886963, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8453, + "eval_samples_per_second": 20.346, + "eval_steps_per_second": 0.675, + "step": 13650 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.72, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4277, + "max_norm": 42.53453063964844, + "max_norm/layer0": 32.37334060668945, + "max_norm/layer1": 34.23046875, + "max_norm/layer10": 36.06345748901367, + "max_norm/layer11": 32.92584228515625, + "max_norm/layer12": 38.15459442138672, + "max_norm/layer13": 33.48106002807617, + "max_norm/layer14": 34.505126953125, + "max_norm/layer15": 42.039798736572266, + "max_norm/layer16": 34.5018196105957, + "max_norm/layer17": 42.53453063964844, + "max_norm/layer18": 36.77006530761719, + "max_norm/layer19": 36.20204162597656, + "max_norm/layer2": 25.69436264038086, + "max_norm/layer20": 36.26368713378906, + "max_norm/layer21": 36.49669647216797, + "max_norm/layer22": 36.958030700683594, + "max_norm/layer23": 35.077667236328125, + "max_norm/layer3": 32.64958953857422, + "max_norm/layer4": 32.6416130065918, + "max_norm/layer5": 41.52423858642578, + "max_norm/layer6": 27.177854537963867, + "max_norm/layer7": 35.69281005859375, + "max_norm/layer8": 34.58332061767578, + "max_norm/layer9": 35.11589050292969, + "mean_norm": 11.542051893969377, + "mean_norm/layer0": 11.398241758346558, + "mean_norm/layer1": 10.9800386428833, + "mean_norm/layer10": 11.301402509212494, + "mean_norm/layer11": 11.70227837562561, + "mean_norm/layer12": 12.457101702690125, + "mean_norm/layer13": 11.332804679870605, + "mean_norm/layer14": 11.790894746780396, + "mean_norm/layer15": 12.233994662761688, + "mean_norm/layer16": 11.401872217655182, + "mean_norm/layer17": 11.96843957901001, + "mean_norm/layer18": 11.381479799747467, + "mean_norm/layer19": 11.45817643404007, + "mean_norm/layer2": 9.160508751869202, + "mean_norm/layer20": 11.563453137874603, + "mean_norm/layer21": 11.530731439590454, + "mean_norm/layer22": 12.75810968875885, + "mean_norm/layer23": 12.712501466274261, + "mean_norm/layer3": 12.233920216560364, + "mean_norm/layer4": 10.658356189727783, + "mean_norm/layer5": 13.753542840480804, + "mean_norm/layer6": 10.030904114246368, + "mean_norm/layer7": 10.693680703639984, + "mean_norm/layer8": 11.299498975276947, + "mean_norm/layer9": 11.207312822341919, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 13700 + }, + { + "epoch": 5.72, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.47006810171045216, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.705110549926758, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8501, + "eval_samples_per_second": 20.337, + "eval_steps_per_second": 0.675, + "step": 13700 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.74, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4468, + "max_norm": 42.64570999145508, + "max_norm/layer0": 32.44587707519531, + "max_norm/layer1": 34.328102111816406, + "max_norm/layer10": 36.16082763671875, + "max_norm/layer11": 32.99917984008789, + "max_norm/layer12": 38.26010513305664, + "max_norm/layer13": 33.561012268066406, + "max_norm/layer14": 34.574607849121094, + "max_norm/layer15": 42.16282653808594, + "max_norm/layer16": 34.6053466796875, + "max_norm/layer17": 42.64570999145508, + "max_norm/layer18": 36.88127899169922, + "max_norm/layer19": 36.302093505859375, + "max_norm/layer2": 25.726064682006836, + "max_norm/layer20": 36.354103088378906, + "max_norm/layer21": 36.58729934692383, + "max_norm/layer22": 37.044952392578125, + "max_norm/layer23": 35.16257858276367, + "max_norm/layer3": 32.70930480957031, + "max_norm/layer4": 32.71389389038086, + "max_norm/layer5": 41.630611419677734, + "max_norm/layer6": 27.24214744567871, + "max_norm/layer7": 35.78268051147461, + "max_norm/layer8": 34.67084503173828, + "max_norm/layer9": 35.19058609008789, + "mean_norm": 11.55191034078598, + "mean_norm/layer0": 11.41158139705658, + "mean_norm/layer1": 10.989613711833954, + "mean_norm/layer10": 11.31038248538971, + "mean_norm/layer11": 11.712275445461273, + "mean_norm/layer12": 12.469912946224213, + "mean_norm/layer13": 11.342234253883362, + "mean_norm/layer14": 11.801217436790466, + "mean_norm/layer15": 12.245729267597198, + "mean_norm/layer16": 11.411094605922699, + "mean_norm/layer17": 11.978409945964813, + "mean_norm/layer18": 11.38983964920044, + "mean_norm/layer19": 11.466777920722961, + "mean_norm/layer2": 9.164218246936798, + "mean_norm/layer20": 11.571929335594177, + "mean_norm/layer21": 11.539337873458862, + "mean_norm/layer22": 12.769851624965668, + "mean_norm/layer23": 12.7243931889534, + "mean_norm/layer3": 12.246965825557709, + "mean_norm/layer4": 10.66619747877121, + "mean_norm/layer5": 13.770685732364655, + "mean_norm/layer6": 10.03677612543106, + "mean_norm/layer7": 10.701447129249573, + "mean_norm/layer8": 11.308717370033264, + "mean_norm/layer9": 11.216259181499481, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 13750 + }, + { + "epoch": 5.74, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4706521783218343, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7009119987487793, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8368, + "eval_samples_per_second": 20.36, + "eval_steps_per_second": 0.676, + "step": 13750 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.76, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4278, + "max_norm": 42.74515151977539, + "max_norm/layer0": 32.518287658691406, + "max_norm/layer1": 34.43461990356445, + "max_norm/layer10": 36.25341033935547, + "max_norm/layer11": 33.06514358520508, + "max_norm/layer12": 38.34977340698242, + "max_norm/layer13": 33.64243698120117, + "max_norm/layer14": 34.654720306396484, + "max_norm/layer15": 42.259647369384766, + "max_norm/layer16": 34.71818542480469, + "max_norm/layer17": 42.74515151977539, + "max_norm/layer18": 36.984222412109375, + "max_norm/layer19": 36.397159576416016, + "max_norm/layer2": 25.7700252532959, + "max_norm/layer20": 36.44501876831055, + "max_norm/layer21": 36.675048828125, + "max_norm/layer22": 37.133079528808594, + "max_norm/layer23": 35.23983383178711, + "max_norm/layer3": 32.766868591308594, + "max_norm/layer4": 32.78180694580078, + "max_norm/layer5": 41.73137283325195, + "max_norm/layer6": 27.297748565673828, + "max_norm/layer7": 35.863887786865234, + "max_norm/layer8": 34.7591438293457, + "max_norm/layer9": 35.272220611572266, + "mean_norm": 11.561812994380793, + "mean_norm/layer0": 11.425028920173645, + "mean_norm/layer1": 10.999259412288666, + "mean_norm/layer10": 11.319396913051605, + "mean_norm/layer11": 11.722336232662201, + "mean_norm/layer12": 12.482789993286133, + "mean_norm/layer13": 11.35170429944992, + "mean_norm/layer14": 11.811590790748596, + "mean_norm/layer15": 12.257381975650787, + "mean_norm/layer16": 11.42035436630249, + "mean_norm/layer17": 11.988508760929108, + "mean_norm/layer18": 11.398184061050415, + "mean_norm/layer19": 11.475438952445984, + "mean_norm/layer2": 9.167939245700836, + "mean_norm/layer20": 11.580475270748138, + "mean_norm/layer21": 11.548064768314362, + "mean_norm/layer22": 12.781589150428772, + "mean_norm/layer23": 12.736304581165314, + "mean_norm/layer3": 12.26003360748291, + "mean_norm/layer4": 10.674065291881561, + "mean_norm/layer5": 13.787844359874725, + "mean_norm/layer6": 10.04273635149002, + "mean_norm/layer7": 10.709193885326385, + "mean_norm/layer8": 11.318026006221771, + "mean_norm/layer9": 11.22526466846466, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 13800 + }, + { + "epoch": 5.76, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4695935394637041, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7042880058288574, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8457, + "eval_samples_per_second": 20.345, + "eval_steps_per_second": 0.675, + "step": 13800 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.78, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4311, + "max_norm": 42.867034912109375, + "max_norm/layer0": 32.59137725830078, + "max_norm/layer1": 34.52602767944336, + "max_norm/layer10": 36.34048080444336, + "max_norm/layer11": 33.140743255615234, + "max_norm/layer12": 38.443443298339844, + "max_norm/layer13": 33.72990798950195, + "max_norm/layer14": 34.72901916503906, + "max_norm/layer15": 42.37352752685547, + "max_norm/layer16": 34.81253433227539, + "max_norm/layer17": 42.867034912109375, + "max_norm/layer18": 37.07355499267578, + "max_norm/layer19": 36.49341583251953, + "max_norm/layer2": 25.837297439575195, + "max_norm/layer20": 36.53437042236328, + "max_norm/layer21": 36.775245666503906, + "max_norm/layer22": 37.215858459472656, + "max_norm/layer23": 35.314640045166016, + "max_norm/layer3": 32.82737731933594, + "max_norm/layer4": 32.852108001708984, + "max_norm/layer5": 41.8297233581543, + "max_norm/layer6": 27.339946746826172, + "max_norm/layer7": 35.94553756713867, + "max_norm/layer8": 34.851322174072266, + "max_norm/layer9": 35.35096740722656, + "mean_norm": 11.571596026420593, + "mean_norm/layer0": 11.438275337219238, + "mean_norm/layer1": 11.008784472942352, + "mean_norm/layer10": 11.328203916549683, + "mean_norm/layer11": 11.732258260250092, + "mean_norm/layer12": 12.495415687561035, + "mean_norm/layer13": 11.360939621925354, + "mean_norm/layer14": 11.821831226348877, + "mean_norm/layer15": 12.269017338752747, + "mean_norm/layer16": 11.429407954216003, + "mean_norm/layer17": 11.99849796295166, + "mean_norm/layer18": 11.406443893909454, + "mean_norm/layer19": 11.4840726852417, + "mean_norm/layer2": 9.171578586101532, + "mean_norm/layer20": 11.589037954807281, + "mean_norm/layer21": 11.55676382780075, + "mean_norm/layer22": 12.793222546577454, + "mean_norm/layer23": 12.748144805431366, + "mean_norm/layer3": 12.27302098274231, + "mean_norm/layer4": 10.68181574344635, + "mean_norm/layer5": 13.804852664470673, + "mean_norm/layer6": 10.048506796360016, + "mean_norm/layer7": 10.716846406459808, + "mean_norm/layer8": 11.327199518680573, + "mean_norm/layer9": 11.234166443347931, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 13850 + }, + { + "epoch": 5.78, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4705913370081487, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7011148929595947, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6359, + "eval_samples_per_second": 20.712, + "eval_steps_per_second": 0.688, + "step": 13850 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.8, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4379, + "max_norm": 42.9991340637207, + "max_norm/layer0": 32.67675018310547, + "max_norm/layer1": 34.62179183959961, + "max_norm/layer10": 36.44373321533203, + "max_norm/layer11": 33.20524978637695, + "max_norm/layer12": 38.551753997802734, + "max_norm/layer13": 33.821502685546875, + "max_norm/layer14": 34.808998107910156, + "max_norm/layer15": 42.49689483642578, + "max_norm/layer16": 34.90584182739258, + "max_norm/layer17": 42.9991340637207, + "max_norm/layer18": 37.173526763916016, + "max_norm/layer19": 36.60969161987305, + "max_norm/layer2": 25.892879486083984, + "max_norm/layer20": 36.612857818603516, + "max_norm/layer21": 36.875526428222656, + "max_norm/layer22": 37.30345153808594, + "max_norm/layer23": 35.393680572509766, + "max_norm/layer3": 32.886417388916016, + "max_norm/layer4": 32.9256591796875, + "max_norm/layer5": 41.92585372924805, + "max_norm/layer6": 27.39628028869629, + "max_norm/layer7": 36.030879974365234, + "max_norm/layer8": 34.93297576904297, + "max_norm/layer9": 35.42243194580078, + "mean_norm": 11.581335020562014, + "mean_norm/layer0": 11.45145434141159, + "mean_norm/layer1": 11.018277168273926, + "mean_norm/layer10": 11.33707845211029, + "mean_norm/layer11": 11.742176473140717, + "mean_norm/layer12": 12.507989645004272, + "mean_norm/layer13": 11.370223939418793, + "mean_norm/layer14": 11.831981182098389, + "mean_norm/layer15": 12.280655086040497, + "mean_norm/layer16": 11.438491344451904, + "mean_norm/layer17": 12.00839626789093, + "mean_norm/layer18": 11.414667963981628, + "mean_norm/layer19": 11.49258005619049, + "mean_norm/layer2": 9.175205826759338, + "mean_norm/layer20": 11.597498834133148, + "mean_norm/layer21": 11.565355122089386, + "mean_norm/layer22": 12.804871678352356, + "mean_norm/layer23": 12.75985324382782, + "mean_norm/layer3": 12.285956501960754, + "mean_norm/layer4": 10.689500033855438, + "mean_norm/layer5": 13.821775257587433, + "mean_norm/layer6": 10.054342985153198, + "mean_norm/layer7": 10.724383294582367, + "mean_norm/layer8": 11.336312234401703, + "mean_norm/layer9": 11.243013560771942, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 13900 + }, + { + "epoch": 5.8, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.47070085137278284, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7012670040130615, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8509, + "eval_samples_per_second": 20.336, + "eval_steps_per_second": 0.675, + "step": 13900 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.82, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4347, + "max_norm": 43.10231018066406, + "max_norm/layer0": 32.753517150878906, + "max_norm/layer1": 34.715728759765625, + "max_norm/layer10": 36.539344787597656, + "max_norm/layer11": 33.28629684448242, + "max_norm/layer12": 38.66322326660156, + "max_norm/layer13": 33.89580535888672, + "max_norm/layer14": 34.89205551147461, + "max_norm/layer15": 42.609230041503906, + "max_norm/layer16": 35.00455093383789, + "max_norm/layer17": 43.10231018066406, + "max_norm/layer18": 37.268592834472656, + "max_norm/layer19": 36.70490646362305, + "max_norm/layer2": 25.953227996826172, + "max_norm/layer20": 36.691898345947266, + "max_norm/layer21": 36.96839904785156, + "max_norm/layer22": 37.388004302978516, + "max_norm/layer23": 35.4702262878418, + "max_norm/layer3": 32.95038604736328, + "max_norm/layer4": 32.99562454223633, + "max_norm/layer5": 42.026756286621094, + "max_norm/layer6": 27.448122024536133, + "max_norm/layer7": 36.12428665161133, + "max_norm/layer8": 35.01604080200195, + "max_norm/layer9": 35.487979888916016, + "mean_norm": 11.591110952198505, + "mean_norm/layer0": 11.464677512645721, + "mean_norm/layer1": 11.027840971946716, + "mean_norm/layer10": 11.345887303352356, + "mean_norm/layer11": 11.752020120620728, + "mean_norm/layer12": 12.520609438419342, + "mean_norm/layer13": 11.379559338092804, + "mean_norm/layer14": 11.842145323753357, + "mean_norm/layer15": 12.29226964712143, + "mean_norm/layer16": 11.447559237480164, + "mean_norm/layer17": 12.018401503562927, + "mean_norm/layer18": 11.422959864139557, + "mean_norm/layer19": 11.501260638237, + "mean_norm/layer2": 9.178790748119354, + "mean_norm/layer20": 11.605934798717499, + "mean_norm/layer21": 11.574039816856384, + "mean_norm/layer22": 12.816502630710602, + "mean_norm/layer23": 12.771722674369812, + "mean_norm/layer3": 12.298872590065002, + "mean_norm/layer4": 10.697331547737122, + "mean_norm/layer5": 13.838718593120575, + "mean_norm/layer6": 10.060210466384888, + "mean_norm/layer7": 10.731984496116638, + "mean_norm/layer8": 11.345423817634583, + "mean_norm/layer9": 11.25193977355957, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 13950 + }, + { + "epoch": 5.82, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4698206803681305, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7006213665008545, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 10.8275, + "eval_samples_per_second": 22.258, + "eval_steps_per_second": 0.739, + "step": 13950 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.85, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4341, + "max_norm": 43.21664810180664, + "max_norm/layer0": 32.8301887512207, + "max_norm/layer1": 34.805118560791016, + "max_norm/layer10": 36.62165832519531, + "max_norm/layer11": 33.37471389770508, + "max_norm/layer12": 38.779029846191406, + "max_norm/layer13": 33.97347640991211, + "max_norm/layer14": 34.97389221191406, + "max_norm/layer15": 42.710960388183594, + "max_norm/layer16": 35.09590148925781, + "max_norm/layer17": 43.21664810180664, + "max_norm/layer18": 37.33848571777344, + "max_norm/layer19": 36.80155563354492, + "max_norm/layer2": 26.006290435791016, + "max_norm/layer20": 36.775001525878906, + "max_norm/layer21": 37.05457305908203, + "max_norm/layer22": 37.47380828857422, + "max_norm/layer23": 35.542789459228516, + "max_norm/layer3": 33.01007843017578, + "max_norm/layer4": 33.06580352783203, + "max_norm/layer5": 42.12410354614258, + "max_norm/layer6": 27.502948760986328, + "max_norm/layer7": 36.20676803588867, + "max_norm/layer8": 35.10688781738281, + "max_norm/layer9": 35.55755615234375, + "mean_norm": 11.6008760035038, + "mean_norm/layer0": 11.477870464324951, + "mean_norm/layer1": 11.037355363368988, + "mean_norm/layer10": 11.354801952838898, + "mean_norm/layer11": 11.761891961097717, + "mean_norm/layer12": 12.533324897289276, + "mean_norm/layer13": 11.388908922672272, + "mean_norm/layer14": 11.852356672286987, + "mean_norm/layer15": 12.303934931755066, + "mean_norm/layer16": 11.456604540348053, + "mean_norm/layer17": 12.028372943401337, + "mean_norm/layer18": 11.431184530258179, + "mean_norm/layer19": 11.509862244129181, + "mean_norm/layer2": 9.182381510734558, + "mean_norm/layer20": 11.614325940608978, + "mean_norm/layer21": 11.582619071006775, + "mean_norm/layer22": 12.828144192695618, + "mean_norm/layer23": 12.783535063266754, + "mean_norm/layer3": 12.311726570129395, + "mean_norm/layer4": 10.705096662044525, + "mean_norm/layer5": 13.85563451051712, + "mean_norm/layer6": 10.06605577468872, + "mean_norm/layer7": 10.73960566520691, + "mean_norm/layer8": 11.35459178686142, + "mean_norm/layer9": 11.26083791255951, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 14000 + }, + { + "epoch": 5.85, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4700478212725569, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.6960055828094482, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8363, + "eval_samples_per_second": 20.361, + "eval_steps_per_second": 0.676, + "step": 14000 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.87, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4387, + "max_norm": 43.33818435668945, + "max_norm/layer0": 32.90453338623047, + "max_norm/layer1": 34.89594650268555, + "max_norm/layer10": 36.70533752441406, + "max_norm/layer11": 33.45826721191406, + "max_norm/layer12": 38.879756927490234, + "max_norm/layer13": 34.05232620239258, + "max_norm/layer14": 35.064571380615234, + "max_norm/layer15": 42.82941436767578, + "max_norm/layer16": 35.18965530395508, + "max_norm/layer17": 43.33818435668945, + "max_norm/layer18": 37.43769073486328, + "max_norm/layer19": 36.90222930908203, + "max_norm/layer2": 26.053985595703125, + "max_norm/layer20": 36.861148834228516, + "max_norm/layer21": 37.14982223510742, + "max_norm/layer22": 37.572227478027344, + "max_norm/layer23": 35.62480545043945, + "max_norm/layer3": 33.07106399536133, + "max_norm/layer4": 33.13713836669922, + "max_norm/layer5": 42.22083282470703, + "max_norm/layer6": 27.555927276611328, + "max_norm/layer7": 36.295875549316406, + "max_norm/layer8": 35.1954345703125, + "max_norm/layer9": 35.63373947143555, + "mean_norm": 11.610697651902834, + "mean_norm/layer0": 11.491089403629303, + "mean_norm/layer1": 11.046924233436584, + "mean_norm/layer10": 11.363676011562347, + "mean_norm/layer11": 11.771858751773834, + "mean_norm/layer12": 12.546132445335388, + "mean_norm/layer13": 11.398319244384766, + "mean_norm/layer14": 11.862588167190552, + "mean_norm/layer15": 12.315575361251831, + "mean_norm/layer16": 11.465714812278748, + "mean_norm/layer17": 12.038424968719482, + "mean_norm/layer18": 11.43947297334671, + "mean_norm/layer19": 11.518530130386353, + "mean_norm/layer2": 9.186090588569641, + "mean_norm/layer20": 11.622918426990509, + "mean_norm/layer21": 11.591268122196198, + "mean_norm/layer22": 12.839798271656036, + "mean_norm/layer23": 12.795412421226501, + "mean_norm/layer3": 12.324716210365295, + "mean_norm/layer4": 10.712847471237183, + "mean_norm/layer5": 13.872604966163635, + "mean_norm/layer6": 10.071965157985687, + "mean_norm/layer7": 10.7472425699234, + "mean_norm/layer8": 11.36383306980133, + "mean_norm/layer9": 11.269739866256714, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 14050 + }, + { + "epoch": 5.87, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46974767079170776, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.6960787773132324, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6345, + "eval_samples_per_second": 20.714, + "eval_steps_per_second": 0.688, + "step": 14050 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.89, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4431, + "max_norm": 43.441749572753906, + "max_norm/layer0": 32.974632263183594, + "max_norm/layer1": 34.989437103271484, + "max_norm/layer10": 36.79485321044922, + "max_norm/layer11": 33.53351974487305, + "max_norm/layer12": 38.98495864868164, + "max_norm/layer13": 34.13669967651367, + "max_norm/layer14": 35.149986267089844, + "max_norm/layer15": 42.9059944152832, + "max_norm/layer16": 35.27094650268555, + "max_norm/layer17": 43.441749572753906, + "max_norm/layer18": 37.5269775390625, + "max_norm/layer19": 36.99470901489258, + "max_norm/layer2": 26.092681884765625, + "max_norm/layer20": 36.94902038574219, + "max_norm/layer21": 37.251434326171875, + "max_norm/layer22": 37.671112060546875, + "max_norm/layer23": 35.70341873168945, + "max_norm/layer3": 33.13298416137695, + "max_norm/layer4": 33.20835876464844, + "max_norm/layer5": 42.318687438964844, + "max_norm/layer6": 27.600130081176758, + "max_norm/layer7": 36.378604888916016, + "max_norm/layer8": 35.283470153808594, + "max_norm/layer9": 35.7142219543457, + "mean_norm": 11.620416504641375, + "mean_norm/layer0": 11.5041783452034, + "mean_norm/layer1": 11.056489646434784, + "mean_norm/layer10": 11.372434675693512, + "mean_norm/layer11": 11.781669199466705, + "mean_norm/layer12": 12.558667540550232, + "mean_norm/layer13": 11.407612383365631, + "mean_norm/layer14": 11.872676074504852, + "mean_norm/layer15": 12.327141106128693, + "mean_norm/layer16": 11.474704504013062, + "mean_norm/layer17": 12.04838103055954, + "mean_norm/layer18": 11.447708785533905, + "mean_norm/layer19": 11.527015447616577, + "mean_norm/layer2": 9.189803123474121, + "mean_norm/layer20": 11.631482064723969, + "mean_norm/layer21": 11.599860608577728, + "mean_norm/layer22": 12.851312100887299, + "mean_norm/layer23": 12.807093441486359, + "mean_norm/layer3": 12.337528228759766, + "mean_norm/layer4": 10.720510184764862, + "mean_norm/layer5": 13.889585733413696, + "mean_norm/layer6": 10.077845275402069, + "mean_norm/layer7": 10.75475662946701, + "mean_norm/layer8": 11.372963190078735, + "mean_norm/layer9": 11.278576791286469, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 14100 + }, + { + "epoch": 5.89, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.47030335479003665, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.6899490356445312, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8606, + "eval_samples_per_second": 20.319, + "eval_steps_per_second": 0.675, + "step": 14100 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.91, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4324, + "max_norm": 43.548465728759766, + "max_norm/layer0": 33.051536560058594, + "max_norm/layer1": 35.0789794921875, + "max_norm/layer10": 36.88705062866211, + "max_norm/layer11": 33.60562515258789, + "max_norm/layer12": 39.086647033691406, + "max_norm/layer13": 34.211490631103516, + "max_norm/layer14": 35.24163818359375, + "max_norm/layer15": 43.00029373168945, + "max_norm/layer16": 35.36878967285156, + "max_norm/layer17": 43.548465728759766, + "max_norm/layer18": 37.62931823730469, + "max_norm/layer19": 37.08994674682617, + "max_norm/layer2": 26.14853858947754, + "max_norm/layer20": 37.03773498535156, + "max_norm/layer21": 37.34528732299805, + "max_norm/layer22": 37.75578308105469, + "max_norm/layer23": 35.7780647277832, + "max_norm/layer3": 33.202308654785156, + "max_norm/layer4": 33.26975631713867, + "max_norm/layer5": 42.42267990112305, + "max_norm/layer6": 27.656192779541016, + "max_norm/layer7": 36.4588508605957, + "max_norm/layer8": 35.362754821777344, + "max_norm/layer9": 35.800048828125, + "mean_norm": 11.630185887217522, + "mean_norm/layer0": 11.517368972301483, + "mean_norm/layer1": 11.066060483455658, + "mean_norm/layer10": 11.381290197372437, + "mean_norm/layer11": 11.791641652584076, + "mean_norm/layer12": 12.57132887840271, + "mean_norm/layer13": 11.416931986808777, + "mean_norm/layer14": 11.882811486721039, + "mean_norm/layer15": 12.338815450668335, + "mean_norm/layer16": 11.483754396438599, + "mean_norm/layer17": 12.058379352092743, + "mean_norm/layer18": 11.456011533737183, + "mean_norm/layer19": 11.535554885864258, + "mean_norm/layer2": 9.193414986133575, + "mean_norm/layer20": 11.639894902706146, + "mean_norm/layer21": 11.608478248119354, + "mean_norm/layer22": 12.862938106060028, + "mean_norm/layer23": 12.818759024143219, + "mean_norm/layer3": 12.350463688373566, + "mean_norm/layer4": 10.728277564048767, + "mean_norm/layer5": 13.906632900238037, + "mean_norm/layer6": 10.083712875843048, + "mean_norm/layer7": 10.76239389181137, + "mean_norm/layer8": 11.382040023803711, + "mean_norm/layer9": 11.287505805492401, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 14150 + }, + { + "epoch": 5.91, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.47015327954961206, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.6898772716522217, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6405, + "eval_samples_per_second": 20.704, + "eval_steps_per_second": 0.687, + "step": 14150 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.93, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4488, + "max_norm": 43.65976333618164, + "max_norm/layer0": 33.13996124267578, + "max_norm/layer1": 35.17390823364258, + "max_norm/layer10": 36.97819137573242, + "max_norm/layer11": 33.683189392089844, + "max_norm/layer12": 39.19681930541992, + "max_norm/layer13": 34.28578186035156, + "max_norm/layer14": 35.341121673583984, + "max_norm/layer15": 43.115135192871094, + "max_norm/layer16": 35.4621696472168, + "max_norm/layer17": 43.65976333618164, + "max_norm/layer18": 37.73054122924805, + "max_norm/layer19": 37.18355178833008, + "max_norm/layer2": 26.213022232055664, + "max_norm/layer20": 37.11777877807617, + "max_norm/layer21": 37.44013595581055, + "max_norm/layer22": 37.8612060546875, + "max_norm/layer23": 35.86772155761719, + "max_norm/layer3": 33.270999908447266, + "max_norm/layer4": 33.32688903808594, + "max_norm/layer5": 42.53396224975586, + "max_norm/layer6": 27.718505859375, + "max_norm/layer7": 36.53450012207031, + "max_norm/layer8": 35.450984954833984, + "max_norm/layer9": 35.87091827392578, + "mean_norm": 11.639934313793978, + "mean_norm/layer0": 11.53043419122696, + "mean_norm/layer1": 11.07560282945633, + "mean_norm/layer10": 11.390058994293213, + "mean_norm/layer11": 11.80152678489685, + "mean_norm/layer12": 12.583993315696716, + "mean_norm/layer13": 11.426232159137726, + "mean_norm/layer14": 11.89290964603424, + "mean_norm/layer15": 12.35047596693039, + "mean_norm/layer16": 11.492808818817139, + "mean_norm/layer17": 12.068269491195679, + "mean_norm/layer18": 11.464175939559937, + "mean_norm/layer19": 11.544139325618744, + "mean_norm/layer2": 9.197042524814606, + "mean_norm/layer20": 11.648470103740692, + "mean_norm/layer21": 11.617040514945984, + "mean_norm/layer22": 12.874555885791779, + "mean_norm/layer23": 12.830484867095947, + "mean_norm/layer3": 12.363328337669373, + "mean_norm/layer4": 10.736116528511047, + "mean_norm/layer5": 13.923593997955322, + "mean_norm/layer6": 10.089556813240051, + "mean_norm/layer7": 10.770008206367493, + "mean_norm/layer8": 11.39112776517868, + "mean_norm/layer9": 11.296470522880554, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 14200 + }, + { + "epoch": 5.93, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.47055888830751635, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.69054913520813, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8311, + "eval_samples_per_second": 20.37, + "eval_steps_per_second": 0.676, + "step": 14200 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.95, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4344, + "max_norm": 43.770164489746094, + "max_norm/layer0": 33.20868682861328, + "max_norm/layer1": 35.26812744140625, + "max_norm/layer10": 37.083702087402344, + "max_norm/layer11": 33.75374984741211, + "max_norm/layer12": 39.29998779296875, + "max_norm/layer13": 34.36618423461914, + "max_norm/layer14": 35.43849563598633, + "max_norm/layer15": 43.22459411621094, + "max_norm/layer16": 35.54741287231445, + "max_norm/layer17": 43.770164489746094, + "max_norm/layer18": 37.811466217041016, + "max_norm/layer19": 37.2822380065918, + "max_norm/layer2": 26.2640323638916, + "max_norm/layer20": 37.19891357421875, + "max_norm/layer21": 37.527061462402344, + "max_norm/layer22": 37.950984954833984, + "max_norm/layer23": 35.96153259277344, + "max_norm/layer3": 33.3438606262207, + "max_norm/layer4": 33.387088775634766, + "max_norm/layer5": 42.64588165283203, + "max_norm/layer6": 27.77462387084961, + "max_norm/layer7": 36.612342834472656, + "max_norm/layer8": 35.532344818115234, + "max_norm/layer9": 35.93207550048828, + "mean_norm": 11.649720599253973, + "mean_norm/layer0": 11.54356062412262, + "mean_norm/layer1": 11.084979772567749, + "mean_norm/layer10": 11.398874163627625, + "mean_norm/layer11": 11.811476826667786, + "mean_norm/layer12": 12.596729159355164, + "mean_norm/layer13": 11.4356250166893, + "mean_norm/layer14": 11.903102099895477, + "mean_norm/layer15": 12.362160086631775, + "mean_norm/layer16": 11.501914262771606, + "mean_norm/layer17": 12.078312635421753, + "mean_norm/layer18": 11.47243356704712, + "mean_norm/layer19": 11.55273050069809, + "mean_norm/layer2": 9.200705409049988, + "mean_norm/layer20": 11.65684986114502, + "mean_norm/layer21": 11.6256822347641, + "mean_norm/layer22": 12.886271953582764, + "mean_norm/layer23": 12.842396259307861, + "mean_norm/layer3": 12.376322150230408, + "mean_norm/layer4": 10.743931829929352, + "mean_norm/layer5": 13.940525889396667, + "mean_norm/layer6": 10.095376551151276, + "mean_norm/layer7": 10.777623057365417, + "mean_norm/layer8": 11.400293707847595, + "mean_norm/layer9": 11.305416762828827, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 14250 + }, + { + "epoch": 5.95, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4709604409778416, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.693927764892578, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8382, + "eval_samples_per_second": 20.358, + "eval_steps_per_second": 0.676, + "step": 14250 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.97, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4414, + "max_norm": 43.877471923828125, + "max_norm/layer0": 33.2783317565918, + "max_norm/layer1": 35.36090850830078, + "max_norm/layer10": 37.202369689941406, + "max_norm/layer11": 33.82597351074219, + "max_norm/layer12": 39.39459991455078, + "max_norm/layer13": 34.450408935546875, + "max_norm/layer14": 35.524879455566406, + "max_norm/layer15": 43.33192825317383, + "max_norm/layer16": 35.63564682006836, + "max_norm/layer17": 43.877471923828125, + "max_norm/layer18": 37.90175247192383, + "max_norm/layer19": 37.37932586669922, + "max_norm/layer2": 26.314382553100586, + "max_norm/layer20": 37.288143157958984, + "max_norm/layer21": 37.59833526611328, + "max_norm/layer22": 38.0389289855957, + "max_norm/layer23": 36.04848098754883, + "max_norm/layer3": 33.40947723388672, + "max_norm/layer4": 33.448463439941406, + "max_norm/layer5": 42.75556182861328, + "max_norm/layer6": 27.835750579833984, + "max_norm/layer7": 36.69871139526367, + "max_norm/layer8": 35.61986541748047, + "max_norm/layer9": 35.991172790527344, + "mean_norm": 11.65939316401879, + "mean_norm/layer0": 11.556526839733124, + "mean_norm/layer1": 11.094407200813293, + "mean_norm/layer10": 11.407621800899506, + "mean_norm/layer11": 11.821186006069183, + "mean_norm/layer12": 12.609242022037506, + "mean_norm/layer13": 11.444914400577545, + "mean_norm/layer14": 11.913126409053802, + "mean_norm/layer15": 12.373706638813019, + "mean_norm/layer16": 11.510907769203186, + "mean_norm/layer17": 12.088223099708557, + "mean_norm/layer18": 11.480640769004822, + "mean_norm/layer19": 11.561327338218689, + "mean_norm/layer2": 9.204297006130219, + "mean_norm/layer20": 11.66532027721405, + "mean_norm/layer21": 11.63420432806015, + "mean_norm/layer22": 12.89782601594925, + "mean_norm/layer23": 12.85407680273056, + "mean_norm/layer3": 12.389108657836914, + "mean_norm/layer4": 10.751596450805664, + "mean_norm/layer5": 13.9572993516922, + "mean_norm/layer6": 10.101068377494812, + "mean_norm/layer7": 10.785195469856262, + "mean_norm/layer8": 11.409336149692535, + "mean_norm/layer9": 11.31427675485611, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 14300 + }, + { + "epoch": 5.97, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.471937958084391, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.687013626098633, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6223, + "eval_samples_per_second": 20.736, + "eval_steps_per_second": 0.688, + "step": 14300 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 5.99, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.4437, + "max_norm": 43.989898681640625, + "max_norm/layer0": 33.34931564331055, + "max_norm/layer1": 35.46033477783203, + "max_norm/layer10": 37.316829681396484, + "max_norm/layer11": 33.88945007324219, + "max_norm/layer12": 39.5078125, + "max_norm/layer13": 34.53520965576172, + "max_norm/layer14": 35.60698699951172, + "max_norm/layer15": 43.46208953857422, + "max_norm/layer16": 35.72053527832031, + "max_norm/layer17": 43.989898681640625, + "max_norm/layer18": 37.99073028564453, + "max_norm/layer19": 37.48189163208008, + "max_norm/layer2": 26.361745834350586, + "max_norm/layer20": 37.369483947753906, + "max_norm/layer21": 37.68265151977539, + "max_norm/layer22": 38.128868103027344, + "max_norm/layer23": 36.1319465637207, + "max_norm/layer3": 33.48076248168945, + "max_norm/layer4": 33.50715255737305, + "max_norm/layer5": 42.86227035522461, + "max_norm/layer6": 27.901187896728516, + "max_norm/layer7": 36.785762786865234, + "max_norm/layer8": 35.692440032958984, + "max_norm/layer9": 36.05787658691406, + "mean_norm": 11.669073348244032, + "mean_norm/layer0": 11.569561958312988, + "mean_norm/layer1": 11.103819906711578, + "mean_norm/layer10": 11.41639906167984, + "mean_norm/layer11": 11.830869317054749, + "mean_norm/layer12": 12.621800243854523, + "mean_norm/layer13": 11.454206645488739, + "mean_norm/layer14": 11.923109650611877, + "mean_norm/layer15": 12.385221660137177, + "mean_norm/layer16": 11.519890904426575, + "mean_norm/layer17": 12.098167896270752, + "mean_norm/layer18": 11.488867819309235, + "mean_norm/layer19": 11.569864094257355, + "mean_norm/layer2": 9.207905173301697, + "mean_norm/layer20": 11.673797130584717, + "mean_norm/layer21": 11.642704725265503, + "mean_norm/layer22": 12.909379720687866, + "mean_norm/layer23": 12.865759074687958, + "mean_norm/layer3": 12.401918411254883, + "mean_norm/layer4": 10.759348154067993, + "mean_norm/layer5": 13.974067091941833, + "mean_norm/layer6": 10.10683810710907, + "mean_norm/layer7": 10.79275369644165, + "mean_norm/layer8": 11.41837626695633, + "mean_norm/layer9": 11.323133647441864, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 14350 + }, + { + "epoch": 5.99, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4716945928296484, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.6884405612945557, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8294, + "eval_samples_per_second": 20.373, + "eval_steps_per_second": 0.676, + "step": 14350 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 6.01, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.3129, + "max_norm": 44.09721374511719, + "max_norm/layer0": 33.424678802490234, + "max_norm/layer1": 35.5435676574707, + "max_norm/layer10": 37.4267578125, + "max_norm/layer11": 33.97317123413086, + "max_norm/layer12": 39.60700225830078, + "max_norm/layer13": 34.626312255859375, + "max_norm/layer14": 35.68148422241211, + "max_norm/layer15": 43.590301513671875, + "max_norm/layer16": 35.797027587890625, + "max_norm/layer17": 44.09721374511719, + "max_norm/layer18": 38.072628021240234, + "max_norm/layer19": 37.573429107666016, + "max_norm/layer2": 26.40358543395996, + "max_norm/layer20": 37.452476501464844, + "max_norm/layer21": 37.774017333984375, + "max_norm/layer22": 38.23457717895508, + "max_norm/layer23": 36.20406723022461, + "max_norm/layer3": 33.54252243041992, + "max_norm/layer4": 33.57847213745117, + "max_norm/layer5": 42.95096969604492, + "max_norm/layer6": 27.952163696289062, + "max_norm/layer7": 36.872596740722656, + "max_norm/layer8": 35.75625228881836, + "max_norm/layer9": 36.12723922729492, + "mean_norm": 11.678674280643463, + "mean_norm/layer0": 11.582400023937225, + "mean_norm/layer1": 11.113045513629913, + "mean_norm/layer10": 11.425013542175293, + "mean_norm/layer11": 11.840567767620087, + "mean_norm/layer12": 12.634274005889893, + "mean_norm/layer13": 11.463509678840637, + "mean_norm/layer14": 11.933098912239075, + "mean_norm/layer15": 12.396642088890076, + "mean_norm/layer16": 11.528850138187408, + "mean_norm/layer17": 12.10803872346878, + "mean_norm/layer18": 11.497036457061768, + "mean_norm/layer19": 11.578483283519745, + "mean_norm/layer2": 9.21142292022705, + "mean_norm/layer20": 11.682356297969818, + "mean_norm/layer21": 11.651371657848358, + "mean_norm/layer22": 12.920911967754364, + "mean_norm/layer23": 12.877335011959076, + "mean_norm/layer3": 12.414536356925964, + "mean_norm/layer4": 10.766944766044617, + "mean_norm/layer5": 13.990516602993011, + "mean_norm/layer6": 10.112547993659973, + "mean_norm/layer7": 10.800214946269989, + "mean_norm/layer8": 11.427287995815277, + "mean_norm/layer9": 11.331776082515717, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 14400 + }, + { + "epoch": 6.01, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46913520156727223, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7376086711883545, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6168, + "eval_samples_per_second": 20.746, + "eval_steps_per_second": 0.689, + "step": 14400 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 6.03, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.2464, + "max_norm": 44.224796295166016, + "max_norm/layer0": 33.49764633178711, + "max_norm/layer1": 35.63376235961914, + "max_norm/layer10": 37.52918243408203, + "max_norm/layer11": 34.06564712524414, + "max_norm/layer12": 39.712989807128906, + "max_norm/layer13": 34.71847915649414, + "max_norm/layer14": 35.767826080322266, + "max_norm/layer15": 43.719058990478516, + "max_norm/layer16": 35.88226318359375, + "max_norm/layer17": 44.224796295166016, + "max_norm/layer18": 38.1541633605957, + "max_norm/layer19": 37.67153549194336, + "max_norm/layer2": 26.451637268066406, + "max_norm/layer20": 37.53163528442383, + "max_norm/layer21": 37.86661148071289, + "max_norm/layer22": 38.343509674072266, + "max_norm/layer23": 36.274871826171875, + "max_norm/layer3": 33.602134704589844, + "max_norm/layer4": 33.64577102661133, + "max_norm/layer5": 43.04342269897461, + "max_norm/layer6": 28.01210594177246, + "max_norm/layer7": 36.95952606201172, + "max_norm/layer8": 35.837249755859375, + "max_norm/layer9": 36.20220947265625, + "mean_norm": 11.688791334629059, + "mean_norm/layer0": 11.596086919307709, + "mean_norm/layer1": 11.122628390789032, + "mean_norm/layer10": 11.433982729911804, + "mean_norm/layer11": 11.85074108839035, + "mean_norm/layer12": 12.647378921508789, + "mean_norm/layer13": 11.473222136497498, + "mean_norm/layer14": 11.943670928478241, + "mean_norm/layer15": 12.408711671829224, + "mean_norm/layer16": 11.538374602794647, + "mean_norm/layer17": 12.11855924129486, + "mean_norm/layer18": 11.505737960338593, + "mean_norm/layer19": 11.587811827659607, + "mean_norm/layer2": 9.215099394321442, + "mean_norm/layer20": 11.691645443439484, + "mean_norm/layer21": 11.660697937011719, + "mean_norm/layer22": 12.93289566040039, + "mean_norm/layer23": 12.889711081981659, + "mean_norm/layer3": 12.427682518959045, + "mean_norm/layer4": 10.774953126907349, + "mean_norm/layer5": 14.00755500793457, + "mean_norm/layer6": 10.118492186069489, + "mean_norm/layer7": 10.80799287557602, + "mean_norm/layer8": 11.436597108840942, + "mean_norm/layer9": 11.34076327085495, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 14450 + }, + { + "epoch": 6.03, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46790215094324317, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.740433931350708, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8406, + "eval_samples_per_second": 20.354, + "eval_steps_per_second": 0.676, + "step": 14450 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 6.05, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.2476, + "max_norm": 44.33781433105469, + "max_norm/layer0": 33.578407287597656, + "max_norm/layer1": 35.71784591674805, + "max_norm/layer10": 37.634239196777344, + "max_norm/layer11": 34.15476989746094, + "max_norm/layer12": 39.832733154296875, + "max_norm/layer13": 34.81980895996094, + "max_norm/layer14": 35.85801315307617, + "max_norm/layer15": 43.835697174072266, + "max_norm/layer16": 35.963539123535156, + "max_norm/layer17": 44.33781433105469, + "max_norm/layer18": 38.23371505737305, + "max_norm/layer19": 37.796539306640625, + "max_norm/layer2": 26.483850479125977, + "max_norm/layer20": 37.608795166015625, + "max_norm/layer21": 37.96210479736328, + "max_norm/layer22": 38.45704650878906, + "max_norm/layer23": 36.3537483215332, + "max_norm/layer3": 33.67289352416992, + "max_norm/layer4": 33.70362091064453, + "max_norm/layer5": 43.14081954956055, + "max_norm/layer6": 28.07660675048828, + "max_norm/layer7": 37.03910827636719, + "max_norm/layer8": 35.92915344238281, + "max_norm/layer9": 36.28647994995117, + "mean_norm": 11.698854426542917, + "mean_norm/layer0": 11.610015153884888, + "mean_norm/layer1": 11.13212662935257, + "mean_norm/layer10": 11.442975342273712, + "mean_norm/layer11": 11.860947608947754, + "mean_norm/layer12": 12.660435795783997, + "mean_norm/layer13": 11.48287183046341, + "mean_norm/layer14": 11.95419842004776, + "mean_norm/layer15": 12.420693695545197, + "mean_norm/layer16": 11.547771215438843, + "mean_norm/layer17": 12.128973543643951, + "mean_norm/layer18": 11.514398634433746, + "mean_norm/layer19": 11.597030580043793, + "mean_norm/layer2": 9.21879118680954, + "mean_norm/layer20": 11.70077121257782, + "mean_norm/layer21": 11.669915497303009, + "mean_norm/layer22": 12.944676518440247, + "mean_norm/layer23": 12.901835203170776, + "mean_norm/layer3": 12.440813302993774, + "mean_norm/layer4": 10.78300029039383, + "mean_norm/layer5": 14.02452540397644, + "mean_norm/layer6": 10.124517142772675, + "mean_norm/layer7": 10.815687239170074, + "mean_norm/layer8": 11.445838451385498, + "mean_norm/layer9": 11.349696338176727, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 14500 + }, + { + "epoch": 6.05, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46863630279505, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7320709228515625, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8508, + "eval_samples_per_second": 20.336, + "eval_steps_per_second": 0.675, + "step": 14500 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 6.08, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.2637, + "max_norm": 44.466896057128906, + "max_norm/layer0": 33.65315246582031, + "max_norm/layer1": 35.79899597167969, + "max_norm/layer10": 37.72567367553711, + "max_norm/layer11": 34.24459457397461, + "max_norm/layer12": 39.92678451538086, + "max_norm/layer13": 34.91712188720703, + "max_norm/layer14": 35.933841705322266, + "max_norm/layer15": 43.96389389038086, + "max_norm/layer16": 36.0675163269043, + "max_norm/layer17": 44.466896057128906, + "max_norm/layer18": 38.311832427978516, + "max_norm/layer19": 37.89857864379883, + "max_norm/layer2": 26.51372528076172, + "max_norm/layer20": 37.69976806640625, + "max_norm/layer21": 38.0622673034668, + "max_norm/layer22": 38.56037521362305, + "max_norm/layer23": 36.4434928894043, + "max_norm/layer3": 33.747703552246094, + "max_norm/layer4": 33.77354049682617, + "max_norm/layer5": 43.23781204223633, + "max_norm/layer6": 28.13241958618164, + "max_norm/layer7": 37.13059997558594, + "max_norm/layer8": 36.016422271728516, + "max_norm/layer9": 36.36855697631836, + "mean_norm": 11.708862346907457, + "mean_norm/layer0": 11.624148964881897, + "mean_norm/layer1": 11.141570508480072, + "mean_norm/layer10": 11.451896965503693, + "mean_norm/layer11": 11.871017575263977, + "mean_norm/layer12": 12.673356175422668, + "mean_norm/layer13": 11.492523610591888, + "mean_norm/layer14": 11.964637100696564, + "mean_norm/layer15": 12.432619631290436, + "mean_norm/layer16": 11.557033240795135, + "mean_norm/layer17": 12.139299035072327, + "mean_norm/layer18": 11.52294272184372, + "mean_norm/layer19": 11.606126606464386, + "mean_norm/layer2": 9.222389996051788, + "mean_norm/layer20": 11.709802210330963, + "mean_norm/layer21": 11.679030537605286, + "mean_norm/layer22": 12.956490218639374, + "mean_norm/layer23": 12.913890182971954, + "mean_norm/layer3": 12.453877091407776, + "mean_norm/layer4": 10.790977239608765, + "mean_norm/layer5": 14.041500270366669, + "mean_norm/layer6": 10.130520582199097, + "mean_norm/layer7": 10.823352634906769, + "mean_norm/layer8": 11.455033659934998, + "mean_norm/layer9": 11.358659565448761, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 14550 + }, + { + "epoch": 6.08, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46778858049102995, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7400739192962646, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6327, + "eval_samples_per_second": 20.717, + "eval_steps_per_second": 0.688, + "step": 14550 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 6.1, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.2673, + "max_norm": 44.583953857421875, + "max_norm/layer0": 33.732749938964844, + "max_norm/layer1": 35.883670806884766, + "max_norm/layer10": 37.817840576171875, + "max_norm/layer11": 34.32735824584961, + "max_norm/layer12": 40.04595184326172, + "max_norm/layer13": 35.021026611328125, + "max_norm/layer14": 36.01658630371094, + "max_norm/layer15": 44.089717864990234, + "max_norm/layer16": 36.161041259765625, + "max_norm/layer17": 44.583953857421875, + "max_norm/layer18": 38.40084457397461, + "max_norm/layer19": 37.9990234375, + "max_norm/layer2": 26.546798706054688, + "max_norm/layer20": 37.787086486816406, + "max_norm/layer21": 38.14870071411133, + "max_norm/layer22": 38.677337646484375, + "max_norm/layer23": 36.53557205200195, + "max_norm/layer3": 33.816959381103516, + "max_norm/layer4": 33.839500427246094, + "max_norm/layer5": 43.33034133911133, + "max_norm/layer6": 28.18335723876953, + "max_norm/layer7": 37.20534896850586, + "max_norm/layer8": 36.09880065917969, + "max_norm/layer9": 36.45109939575195, + "mean_norm": 11.718958477179209, + "mean_norm/layer0": 11.638537287712097, + "mean_norm/layer1": 11.151164829730988, + "mean_norm/layer10": 11.460838198661804, + "mean_norm/layer11": 11.881148874759674, + "mean_norm/layer12": 12.686423182487488, + "mean_norm/layer13": 11.502274334430695, + "mean_norm/layer14": 11.975151538848877, + "mean_norm/layer15": 12.444611430168152, + "mean_norm/layer16": 11.566363215446472, + "mean_norm/layer17": 12.149612188339233, + "mean_norm/layer18": 11.531615495681763, + "mean_norm/layer19": 11.615218698978424, + "mean_norm/layer2": 9.226134121418, + "mean_norm/layer20": 11.718867301940918, + "mean_norm/layer21": 11.688138842582703, + "mean_norm/layer22": 12.968413412570953, + "mean_norm/layer23": 12.926041781902313, + "mean_norm/layer3": 12.467107772827148, + "mean_norm/layer4": 10.79892909526825, + "mean_norm/layer5": 14.058703899383545, + "mean_norm/layer6": 10.13658756017685, + "mean_norm/layer7": 10.831100225448608, + "mean_norm/layer8": 11.464323878288269, + "mean_norm/layer9": 11.367696285247803, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 14600 + }, + { + "epoch": 6.1, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4664500715899458, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7531161308288574, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6421, + "eval_samples_per_second": 20.701, + "eval_steps_per_second": 0.687, + "step": 14600 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 6.12, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.2826, + "max_norm": 44.69528579711914, + "max_norm/layer0": 33.810848236083984, + "max_norm/layer1": 35.97419357299805, + "max_norm/layer10": 37.910186767578125, + "max_norm/layer11": 34.40093994140625, + "max_norm/layer12": 40.16526412963867, + "max_norm/layer13": 35.1344108581543, + "max_norm/layer14": 36.102210998535156, + "max_norm/layer15": 44.21253967285156, + "max_norm/layer16": 36.24266815185547, + "max_norm/layer17": 44.69528579711914, + "max_norm/layer18": 38.483097076416016, + "max_norm/layer19": 38.10674285888672, + "max_norm/layer2": 26.580692291259766, + "max_norm/layer20": 37.87656021118164, + "max_norm/layer21": 38.24087905883789, + "max_norm/layer22": 38.77226257324219, + "max_norm/layer23": 36.63397979736328, + "max_norm/layer3": 33.88368225097656, + "max_norm/layer4": 33.91764831542969, + "max_norm/layer5": 43.41983413696289, + "max_norm/layer6": 28.235586166381836, + "max_norm/layer7": 37.27918243408203, + "max_norm/layer8": 36.18343734741211, + "max_norm/layer9": 36.5324821472168, + "mean_norm": 11.72901346286138, + "mean_norm/layer0": 11.652945280075073, + "mean_norm/layer1": 11.160664916038513, + "mean_norm/layer10": 11.469777524471283, + "mean_norm/layer11": 11.891315817832947, + "mean_norm/layer12": 12.6994588971138, + "mean_norm/layer13": 11.511991381645203, + "mean_norm/layer14": 11.985653817653656, + "mean_norm/layer15": 12.45661973953247, + "mean_norm/layer16": 11.575735986232758, + "mean_norm/layer17": 12.159762263298035, + "mean_norm/layer18": 11.540223777294159, + "mean_norm/layer19": 11.624176979064941, + "mean_norm/layer2": 9.229885399341583, + "mean_norm/layer20": 11.727642595767975, + "mean_norm/layer21": 11.697233855724335, + "mean_norm/layer22": 12.980267107486725, + "mean_norm/layer23": 12.938136041164398, + "mean_norm/layer3": 12.480332374572754, + "mean_norm/layer4": 10.80697101354599, + "mean_norm/layer5": 14.075869083404541, + "mean_norm/layer6": 10.142605304718018, + "mean_norm/layer7": 10.838842630386353, + "mean_norm/layer8": 11.4734987616539, + "mean_norm/layer9": 11.376712560653687, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 14650 + }, + { + "epoch": 6.12, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4675654956741826, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7478952407836914, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6343, + "eval_samples_per_second": 20.715, + "eval_steps_per_second": 0.688, + "step": 14650 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 6.14, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.2803, + "max_norm": 44.81999969482422, + "max_norm/layer0": 33.90229415893555, + "max_norm/layer1": 36.06707000732422, + "max_norm/layer10": 38.000553131103516, + "max_norm/layer11": 34.46437072753906, + "max_norm/layer12": 40.27119445800781, + "max_norm/layer13": 35.24424362182617, + "max_norm/layer14": 36.18069076538086, + "max_norm/layer15": 44.345882415771484, + "max_norm/layer16": 36.323299407958984, + "max_norm/layer17": 44.81999969482422, + "max_norm/layer18": 38.57911682128906, + "max_norm/layer19": 38.21243667602539, + "max_norm/layer2": 26.61791229248047, + "max_norm/layer20": 37.95322036743164, + "max_norm/layer21": 38.327857971191406, + "max_norm/layer22": 38.86759948730469, + "max_norm/layer23": 36.73441696166992, + "max_norm/layer3": 33.94342041015625, + "max_norm/layer4": 33.98491668701172, + "max_norm/layer5": 43.51378631591797, + "max_norm/layer6": 28.28629493713379, + "max_norm/layer7": 37.365936279296875, + "max_norm/layer8": 36.26069641113281, + "max_norm/layer9": 36.62409210205078, + "mean_norm": 11.73909062643846, + "mean_norm/layer0": 11.667441129684448, + "mean_norm/layer1": 11.170315623283386, + "mean_norm/layer10": 11.478734910488129, + "mean_norm/layer11": 11.901362717151642, + "mean_norm/layer12": 12.712479770183563, + "mean_norm/layer13": 11.521682798862457, + "mean_norm/layer14": 11.996141493320465, + "mean_norm/layer15": 12.4685178399086, + "mean_norm/layer16": 11.585081934928894, + "mean_norm/layer17": 12.170037686824799, + "mean_norm/layer18": 11.548860013484955, + "mean_norm/layer19": 11.633151412010193, + "mean_norm/layer2": 9.233680367469788, + "mean_norm/layer20": 11.736494660377502, + "mean_norm/layer21": 11.706235766410828, + "mean_norm/layer22": 12.99212795495987, + "mean_norm/layer23": 12.950253963470459, + "mean_norm/layer3": 12.49367219209671, + "mean_norm/layer4": 10.815063416957855, + "mean_norm/layer5": 14.093105018138885, + "mean_norm/layer6": 10.148611605167389, + "mean_norm/layer7": 10.846603572368622, + "mean_norm/layer8": 11.482750594615936, + "mean_norm/layer9": 11.385768592357635, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 14700 + }, + { + "epoch": 6.14, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4669651947124842, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.744550943374634, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8594, + "eval_samples_per_second": 20.321, + "eval_steps_per_second": 0.675, + "step": 14700 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 6.16, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.2888, + "max_norm": 44.948341369628906, + "max_norm/layer0": 33.99632263183594, + "max_norm/layer1": 36.15312957763672, + "max_norm/layer10": 38.092010498046875, + "max_norm/layer11": 34.52595901489258, + "max_norm/layer12": 40.37563705444336, + "max_norm/layer13": 35.3314094543457, + "max_norm/layer14": 36.26191711425781, + "max_norm/layer15": 44.47978973388672, + "max_norm/layer16": 36.41969299316406, + "max_norm/layer17": 44.948341369628906, + "max_norm/layer18": 38.67579650878906, + "max_norm/layer19": 38.30149841308594, + "max_norm/layer2": 26.659557342529297, + "max_norm/layer20": 38.041748046875, + "max_norm/layer21": 38.415489196777344, + "max_norm/layer22": 38.947418212890625, + "max_norm/layer23": 36.82078552246094, + "max_norm/layer3": 34.01167678833008, + "max_norm/layer4": 34.06661605834961, + "max_norm/layer5": 43.61132049560547, + "max_norm/layer6": 28.341476440429688, + "max_norm/layer7": 37.45941925048828, + "max_norm/layer8": 36.348426818847656, + "max_norm/layer9": 36.70441436767578, + "mean_norm": 11.749220199882984, + "mean_norm/layer0": 11.682098507881165, + "mean_norm/layer1": 11.180002629756927, + "mean_norm/layer10": 11.487772464752197, + "mean_norm/layer11": 11.911587059497833, + "mean_norm/layer12": 12.725587904453278, + "mean_norm/layer13": 11.531331658363342, + "mean_norm/layer14": 12.006726801395416, + "mean_norm/layer15": 12.48053240776062, + "mean_norm/layer16": 11.594469606876373, + "mean_norm/layer17": 12.180344343185425, + "mean_norm/layer18": 11.557434797286987, + "mean_norm/layer19": 11.642093479633331, + "mean_norm/layer2": 9.237485826015472, + "mean_norm/layer20": 11.745355069637299, + "mean_norm/layer21": 11.715200185775757, + "mean_norm/layer22": 13.004086434841156, + "mean_norm/layer23": 12.962449193000793, + "mean_norm/layer3": 12.507059156894684, + "mean_norm/layer4": 10.823196411132812, + "mean_norm/layer5": 14.110482037067413, + "mean_norm/layer6": 10.154706180095673, + "mean_norm/layer7": 10.854439437389374, + "mean_norm/layer8": 11.492040276527405, + "mean_norm/layer9": 11.394802927970886, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 14750 + }, + { + "epoch": 6.16, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.4657443123511923, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.750763416290283, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.67, + "eval_samples_per_second": 20.651, + "eval_steps_per_second": 0.686, + "step": 14750 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 6.18, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.303, + "max_norm": 45.073246002197266, + "max_norm/layer0": 34.08710861206055, + "max_norm/layer1": 36.244224548339844, + "max_norm/layer10": 38.180023193359375, + "max_norm/layer11": 34.58510971069336, + "max_norm/layer12": 40.496421813964844, + "max_norm/layer13": 35.42164993286133, + "max_norm/layer14": 36.34925079345703, + "max_norm/layer15": 44.600223541259766, + "max_norm/layer16": 36.52353286743164, + "max_norm/layer17": 45.073246002197266, + "max_norm/layer18": 38.772789001464844, + "max_norm/layer19": 38.385990142822266, + "max_norm/layer2": 26.702438354492188, + "max_norm/layer20": 38.13774871826172, + "max_norm/layer21": 38.51622009277344, + "max_norm/layer22": 39.0334358215332, + "max_norm/layer23": 36.904296875, + "max_norm/layer3": 34.07844543457031, + "max_norm/layer4": 34.143314361572266, + "max_norm/layer5": 43.70988845825195, + "max_norm/layer6": 28.39101219177246, + "max_norm/layer7": 37.5562629699707, + "max_norm/layer8": 36.42280578613281, + "max_norm/layer9": 36.77370071411133, + "mean_norm": 11.759335647026697, + "mean_norm/layer0": 11.696792960166931, + "mean_norm/layer1": 11.189741432666779, + "mean_norm/layer10": 11.496793627738953, + "mean_norm/layer11": 11.921910107135773, + "mean_norm/layer12": 12.73866891860962, + "mean_norm/layer13": 11.541031777858734, + "mean_norm/layer14": 12.017287492752075, + "mean_norm/layer15": 12.492536306381226, + "mean_norm/layer16": 11.603844463825226, + "mean_norm/layer17": 12.190562188625336, + "mean_norm/layer18": 11.566004931926727, + "mean_norm/layer19": 11.651012122631073, + "mean_norm/layer2": 9.241271734237671, + "mean_norm/layer20": 11.754229307174683, + "mean_norm/layer21": 11.724102795124054, + "mean_norm/layer22": 13.015969455242157, + "mean_norm/layer23": 12.974500477313995, + "mean_norm/layer3": 12.520442187786102, + "mean_norm/layer4": 10.831291019916534, + "mean_norm/layer5": 14.127792298793793, + "mean_norm/layer6": 10.160741567611694, + "mean_norm/layer7": 10.862253546714783, + "mean_norm/layer8": 11.501340448856354, + "mean_norm/layer9": 11.403934359550476, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 14800 + }, + { + "epoch": 6.18, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46723289649270106, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.738095283508301, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6524, + "eval_samples_per_second": 20.683, + "eval_steps_per_second": 0.687, + "step": 14800 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 6.2, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.3071, + "max_norm": 45.186065673828125, + "max_norm/layer0": 34.180145263671875, + "max_norm/layer1": 36.340614318847656, + "max_norm/layer10": 38.263370513916016, + "max_norm/layer11": 34.65528106689453, + "max_norm/layer12": 40.61335754394531, + "max_norm/layer13": 35.51411437988281, + "max_norm/layer14": 36.4224739074707, + "max_norm/layer15": 44.72835159301758, + "max_norm/layer16": 36.632625579833984, + "max_norm/layer17": 45.186065673828125, + "max_norm/layer18": 38.86900329589844, + "max_norm/layer19": 38.483543395996094, + "max_norm/layer2": 26.746105194091797, + "max_norm/layer20": 38.22907638549805, + "max_norm/layer21": 38.60087203979492, + "max_norm/layer22": 39.13743591308594, + "max_norm/layer23": 36.99153518676758, + "max_norm/layer3": 34.13496017456055, + "max_norm/layer4": 34.21876525878906, + "max_norm/layer5": 43.80707931518555, + "max_norm/layer6": 28.444496154785156, + "max_norm/layer7": 37.6572380065918, + "max_norm/layer8": 36.48862075805664, + "max_norm/layer9": 36.847434997558594, + "mean_norm": 11.769410625100136, + "mean_norm/layer0": 11.71136349439621, + "mean_norm/layer1": 11.19951182603836, + "mean_norm/layer10": 11.505762279033661, + "mean_norm/layer11": 11.932011187076569, + "mean_norm/layer12": 12.751639366149902, + "mean_norm/layer13": 11.550610899925232, + "mean_norm/layer14": 12.027763426303864, + "mean_norm/layer15": 12.504477262496948, + "mean_norm/layer16": 11.613188326358795, + "mean_norm/layer17": 12.20076310634613, + "mean_norm/layer18": 11.574527025222778, + "mean_norm/layer19": 11.660000503063202, + "mean_norm/layer2": 9.245114207267761, + "mean_norm/layer20": 11.763050854206085, + "mean_norm/layer21": 11.733014643192291, + "mean_norm/layer22": 13.027836441993713, + "mean_norm/layer23": 12.986533343791962, + "mean_norm/layer3": 12.533765077590942, + "mean_norm/layer4": 10.839352071285248, + "mean_norm/layer5": 14.145084381103516, + "mean_norm/layer6": 10.166761040687561, + "mean_norm/layer7": 10.870099246501923, + "mean_norm/layer8": 11.51064658164978, + "mean_norm/layer9": 11.412978410720825, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 14850 + }, + { + "epoch": 6.2, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46671371728258354, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7497682571411133, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 10.8261, + "eval_samples_per_second": 22.261, + "eval_steps_per_second": 0.739, + "step": 14850 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 6.22, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.3014, + "max_norm": 45.308223724365234, + "max_norm/layer0": 34.267417907714844, + "max_norm/layer1": 36.43744659423828, + "max_norm/layer10": 38.35849380493164, + "max_norm/layer11": 34.72025680541992, + "max_norm/layer12": 40.71356201171875, + "max_norm/layer13": 35.608646392822266, + "max_norm/layer14": 36.5001220703125, + "max_norm/layer15": 44.83946228027344, + "max_norm/layer16": 36.73179244995117, + "max_norm/layer17": 45.308223724365234, + "max_norm/layer18": 38.9741325378418, + "max_norm/layer19": 38.586544036865234, + "max_norm/layer2": 26.78317642211914, + "max_norm/layer20": 38.316619873046875, + "max_norm/layer21": 38.68571853637695, + "max_norm/layer22": 39.225032806396484, + "max_norm/layer23": 37.06938171386719, + "max_norm/layer3": 34.203548431396484, + "max_norm/layer4": 34.2883415222168, + "max_norm/layer5": 43.896480560302734, + "max_norm/layer6": 28.498565673828125, + "max_norm/layer7": 37.7492790222168, + "max_norm/layer8": 36.55672073364258, + "max_norm/layer9": 36.92335891723633, + "mean_norm": 11.779515077670416, + "mean_norm/layer0": 11.726049065589905, + "mean_norm/layer1": 11.209324061870575, + "mean_norm/layer10": 11.514764368534088, + "mean_norm/layer11": 11.942122519016266, + "mean_norm/layer12": 12.764708518981934, + "mean_norm/layer13": 11.560275077819824, + "mean_norm/layer14": 12.038271605968475, + "mean_norm/layer15": 12.51647001504898, + "mean_norm/layer16": 11.622543811798096, + "mean_norm/layer17": 12.210929572582245, + "mean_norm/layer18": 11.583010852336884, + "mean_norm/layer19": 11.668940365314484, + "mean_norm/layer2": 9.248961925506592, + "mean_norm/layer20": 11.771803140640259, + "mean_norm/layer21": 11.74181979894638, + "mean_norm/layer22": 13.039653956890106, + "mean_norm/layer23": 12.998541593551636, + "mean_norm/layer3": 12.547242283821106, + "mean_norm/layer4": 10.84747463464737, + "mean_norm/layer5": 14.16251653432846, + "mean_norm/layer6": 10.172904789447784, + "mean_norm/layer7": 10.877913773059845, + "mean_norm/layer8": 11.520046174526215, + "mean_norm/layer9": 11.422073423862457, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 14900 + }, + { + "epoch": 6.22, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46574025626361326, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.743490219116211, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.8386, + "eval_samples_per_second": 20.357, + "eval_steps_per_second": 0.676, + "step": 14900 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 6.24, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.3088, + "max_norm": 45.41685104370117, + "max_norm/layer0": 34.35284423828125, + "max_norm/layer1": 36.526798248291016, + "max_norm/layer10": 38.4525146484375, + "max_norm/layer11": 34.7932243347168, + "max_norm/layer12": 40.7994499206543, + "max_norm/layer13": 35.694664001464844, + "max_norm/layer14": 36.587955474853516, + "max_norm/layer15": 44.962310791015625, + "max_norm/layer16": 36.83222198486328, + "max_norm/layer17": 45.41685104370117, + "max_norm/layer18": 39.11237335205078, + "max_norm/layer19": 38.691707611083984, + "max_norm/layer2": 26.809534072875977, + "max_norm/layer20": 38.412635803222656, + "max_norm/layer21": 38.78028869628906, + "max_norm/layer22": 39.322757720947266, + "max_norm/layer23": 37.13923263549805, + "max_norm/layer3": 34.273311614990234, + "max_norm/layer4": 34.368839263916016, + "max_norm/layer5": 43.9959716796875, + "max_norm/layer6": 28.55388832092285, + "max_norm/layer7": 37.8399658203125, + "max_norm/layer8": 36.626319885253906, + "max_norm/layer9": 36.991241455078125, + "mean_norm": 11.789648773769537, + "mean_norm/layer0": 11.740796387195587, + "mean_norm/layer1": 11.219213783740997, + "mean_norm/layer10": 11.523796737194061, + "mean_norm/layer11": 11.952241718769073, + "mean_norm/layer12": 12.777762591838837, + "mean_norm/layer13": 11.569939851760864, + "mean_norm/layer14": 12.048766016960144, + "mean_norm/layer15": 12.528478980064392, + "mean_norm/layer16": 11.63189560174942, + "mean_norm/layer17": 12.221157014369965, + "mean_norm/layer18": 11.591578304767609, + "mean_norm/layer19": 11.6779265999794, + "mean_norm/layer2": 9.252777576446533, + "mean_norm/layer20": 11.780601918697357, + "mean_norm/layer21": 11.750674307346344, + "mean_norm/layer22": 13.051563382148743, + "mean_norm/layer23": 13.010630786418915, + "mean_norm/layer3": 12.56077265739441, + "mean_norm/layer4": 10.855627298355103, + "mean_norm/layer5": 14.179958462715149, + "mean_norm/layer6": 10.179086148738861, + "mean_norm/layer7": 10.885732650756836, + "mean_norm/layer8": 11.529394507408142, + "mean_norm/layer9": 11.43119728565216, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 14950 + }, + { + "epoch": 6.24, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46645818376510384, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7555625438690186, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6207, + "eval_samples_per_second": 20.739, + "eval_steps_per_second": 0.688, + "step": 14950 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 6.26, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "learning_rate": 0.0005, + "loss": 2.3235, + "max_norm": 45.539119720458984, + "max_norm/layer0": 34.44173049926758, + "max_norm/layer1": 36.61558151245117, + "max_norm/layer10": 38.54380416870117, + "max_norm/layer11": 34.865203857421875, + "max_norm/layer12": 40.908504486083984, + "max_norm/layer13": 35.78108215332031, + "max_norm/layer14": 36.67228317260742, + "max_norm/layer15": 45.083438873291016, + "max_norm/layer16": 36.927913665771484, + "max_norm/layer17": 45.539119720458984, + "max_norm/layer18": 39.2352409362793, + "max_norm/layer19": 38.779598236083984, + "max_norm/layer2": 26.836795806884766, + "max_norm/layer20": 38.50577163696289, + "max_norm/layer21": 38.87571334838867, + "max_norm/layer22": 39.42427062988281, + "max_norm/layer23": 37.21847915649414, + "max_norm/layer3": 34.34575271606445, + "max_norm/layer4": 34.4432258605957, + "max_norm/layer5": 44.077754974365234, + "max_norm/layer6": 28.6057071685791, + "max_norm/layer7": 37.91745376586914, + "max_norm/layer8": 36.69032287597656, + "max_norm/layer9": 37.08796691894531, + "mean_norm": 11.799732064207396, + "mean_norm/layer0": 11.755437850952148, + "mean_norm/layer1": 11.22901839017868, + "mean_norm/layer10": 11.532833635807037, + "mean_norm/layer11": 11.962444841861725, + "mean_norm/layer12": 12.79077160358429, + "mean_norm/layer13": 11.57960969209671, + "mean_norm/layer14": 12.059264957904816, + "mean_norm/layer15": 12.540440499782562, + "mean_norm/layer16": 11.641206741333008, + "mean_norm/layer17": 12.231300234794617, + "mean_norm/layer18": 11.600049555301666, + "mean_norm/layer19": 11.686796128749847, + "mean_norm/layer2": 9.256644666194916, + "mean_norm/layer20": 11.78922188282013, + "mean_norm/layer21": 11.759462356567383, + "mean_norm/layer22": 13.063357532024384, + "mean_norm/layer23": 13.022553265094757, + "mean_norm/layer3": 12.574194192886353, + "mean_norm/layer4": 10.863756775856018, + "mean_norm/layer5": 14.197384178638458, + "mean_norm/layer6": 10.185243308544159, + "mean_norm/layer7": 10.893572747707367, + "mean_norm/layer8": 11.53871750831604, + "mean_norm/layer9": 11.440286993980408, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 15000 + }, + { + "epoch": 6.26, + "eval_MSE/layer0": 0.0, + "eval_MSE/layer1": 0.0, + "eval_MSE/layer10": 0.0, + "eval_MSE/layer11": 0.0, + "eval_MSE/layer12": 0.0, + "eval_MSE/layer13": 0.0, + "eval_MSE/layer14": 0.0, + "eval_MSE/layer15": 0.0, + "eval_MSE/layer16": 0.0, + "eval_MSE/layer17": 0.0, + "eval_MSE/layer18": 0.0, + "eval_MSE/layer19": 0.0, + "eval_MSE/layer2": 0.0, + "eval_MSE/layer20": 0.0, + "eval_MSE/layer21": 0.0, + "eval_MSE/layer22": 0.0, + "eval_MSE/layer23": 0.0, + "eval_MSE/layer3": 0.0, + "eval_MSE/layer4": 0.0, + "eval_MSE/layer5": 0.0, + "eval_MSE/layer6": 0.0, + "eval_MSE/layer7": 0.0, + "eval_MSE/layer8": 0.0, + "eval_MSE/layer9": 0.0, + "eval_accuracy": 0.46677861468384824, + "eval_dead_code_fraction/layer0": 1.0, + "eval_dead_code_fraction/layer1": 1.0, + "eval_dead_code_fraction/layer10": 1.0, + "eval_dead_code_fraction/layer11": 1.0, + "eval_dead_code_fraction/layer12": 1.0, + "eval_dead_code_fraction/layer13": 1.0, + "eval_dead_code_fraction/layer14": 1.0, + "eval_dead_code_fraction/layer15": 1.0, + "eval_dead_code_fraction/layer16": 1.0, + "eval_dead_code_fraction/layer17": 1.0, + "eval_dead_code_fraction/layer18": 1.0, + "eval_dead_code_fraction/layer19": 1.0, + "eval_dead_code_fraction/layer2": 1.0, + "eval_dead_code_fraction/layer20": 1.0, + "eval_dead_code_fraction/layer21": 1.0, + "eval_dead_code_fraction/layer22": 1.0, + "eval_dead_code_fraction/layer23": 1.0, + "eval_dead_code_fraction/layer3": 1.0, + "eval_dead_code_fraction/layer4": 1.0, + "eval_dead_code_fraction/layer5": 1.0, + "eval_dead_code_fraction/layer6": 1.0, + "eval_dead_code_fraction/layer7": 1.0, + "eval_dead_code_fraction/layer8": 1.0, + "eval_dead_code_fraction/layer9": 1.0, + "eval_input_norm/layer0": 0.0, + "eval_input_norm/layer1": 0.0, + "eval_input_norm/layer10": 0.0, + "eval_input_norm/layer11": 0.0, + "eval_input_norm/layer12": 0.0, + "eval_input_norm/layer13": 0.0, + "eval_input_norm/layer14": 0.0, + "eval_input_norm/layer15": 0.0, + "eval_input_norm/layer16": 0.0, + "eval_input_norm/layer17": 0.0, + "eval_input_norm/layer18": 0.0, + "eval_input_norm/layer19": 0.0, + "eval_input_norm/layer2": 0.0, + "eval_input_norm/layer20": 0.0, + "eval_input_norm/layer21": 0.0, + "eval_input_norm/layer22": 0.0, + "eval_input_norm/layer23": 0.0, + "eval_input_norm/layer3": 0.0, + "eval_input_norm/layer4": 0.0, + "eval_input_norm/layer5": 0.0, + "eval_input_norm/layer6": 0.0, + "eval_input_norm/layer7": 0.0, + "eval_input_norm/layer8": 0.0, + "eval_input_norm/layer9": 0.0, + "eval_loss": 2.7446389198303223, + "eval_multicode_k": 8, + "eval_output_norm/layer0": 0.0, + "eval_output_norm/layer1": 0.0, + "eval_output_norm/layer10": 0.0, + "eval_output_norm/layer11": 0.0, + "eval_output_norm/layer12": 0.0, + "eval_output_norm/layer13": 0.0, + "eval_output_norm/layer14": 0.0, + "eval_output_norm/layer15": 0.0, + "eval_output_norm/layer16": 0.0, + "eval_output_norm/layer17": 0.0, + "eval_output_norm/layer18": 0.0, + "eval_output_norm/layer19": 0.0, + "eval_output_norm/layer2": 0.0, + "eval_output_norm/layer20": 0.0, + "eval_output_norm/layer21": 0.0, + "eval_output_norm/layer22": 0.0, + "eval_output_norm/layer23": 0.0, + "eval_output_norm/layer3": 0.0, + "eval_output_norm/layer4": 0.0, + "eval_output_norm/layer5": 0.0, + "eval_output_norm/layer6": 0.0, + "eval_output_norm/layer7": 0.0, + "eval_output_norm/layer8": 0.0, + "eval_output_norm/layer9": 0.0, + "eval_runtime": 11.6412, + "eval_samples_per_second": 20.702, + "eval_steps_per_second": 0.687, + "step": 15000 + }, + { + "MSE": 0.0, + "MSE/layer0": 0.0, + "MSE/layer1": 0.0, + "MSE/layer10": 0.0, + "MSE/layer11": 0.0, + "MSE/layer12": 0.0, + "MSE/layer13": 0.0, + "MSE/layer14": 0.0, + "MSE/layer15": 0.0, + "MSE/layer16": 0.0, + "MSE/layer17": 0.0, + "MSE/layer18": 0.0, + "MSE/layer19": 0.0, + "MSE/layer2": 0.0, + "MSE/layer20": 0.0, + "MSE/layer21": 0.0, + "MSE/layer22": 0.0, + "MSE/layer23": 0.0, + "MSE/layer3": 0.0, + "MSE/layer4": 0.0, + "MSE/layer5": 0.0, + "MSE/layer6": 0.0, + "MSE/layer7": 0.0, + "MSE/layer8": 0.0, + "MSE/layer9": 0.0, + "dead_code_fraction": 1.0, + "dead_code_fraction/layer0": 1.0, + "dead_code_fraction/layer1": 1.0, + "dead_code_fraction/layer10": 1.0, + "dead_code_fraction/layer11": 1.0, + "dead_code_fraction/layer12": 1.0, + "dead_code_fraction/layer13": 1.0, + "dead_code_fraction/layer14": 1.0, + "dead_code_fraction/layer15": 1.0, + "dead_code_fraction/layer16": 1.0, + "dead_code_fraction/layer17": 1.0, + "dead_code_fraction/layer18": 1.0, + "dead_code_fraction/layer19": 1.0, + "dead_code_fraction/layer2": 1.0, + "dead_code_fraction/layer20": 1.0, + "dead_code_fraction/layer21": 1.0, + "dead_code_fraction/layer22": 1.0, + "dead_code_fraction/layer23": 1.0, + "dead_code_fraction/layer3": 1.0, + "dead_code_fraction/layer4": 1.0, + "dead_code_fraction/layer5": 1.0, + "dead_code_fraction/layer6": 1.0, + "dead_code_fraction/layer7": 1.0, + "dead_code_fraction/layer8": 1.0, + "dead_code_fraction/layer9": 1.0, + "epoch": 6.26, + "input_norm": 0.0, + "input_norm/layer0": 0.0, + "input_norm/layer1": 0.0, + "input_norm/layer10": 0.0, + "input_norm/layer11": 0.0, + "input_norm/layer12": 0.0, + "input_norm/layer13": 0.0, + "input_norm/layer14": 0.0, + "input_norm/layer15": 0.0, + "input_norm/layer16": 0.0, + "input_norm/layer17": 0.0, + "input_norm/layer18": 0.0, + "input_norm/layer19": 0.0, + "input_norm/layer2": 0.0, + "input_norm/layer20": 0.0, + "input_norm/layer21": 0.0, + "input_norm/layer22": 0.0, + "input_norm/layer23": 0.0, + "input_norm/layer3": 0.0, + "input_norm/layer4": 0.0, + "input_norm/layer5": 0.0, + "input_norm/layer6": 0.0, + "input_norm/layer7": 0.0, + "input_norm/layer8": 0.0, + "input_norm/layer9": 0.0, + "max_norm": 45.539119720458984, + "max_norm/layer0": 34.44173049926758, + "max_norm/layer1": 36.61558151245117, + "max_norm/layer10": 38.54380416870117, + "max_norm/layer11": 34.865203857421875, + "max_norm/layer12": 40.908504486083984, + "max_norm/layer13": 35.78108215332031, + "max_norm/layer14": 36.67228317260742, + "max_norm/layer15": 45.083438873291016, + "max_norm/layer16": 36.927913665771484, + "max_norm/layer17": 45.539119720458984, + "max_norm/layer18": 39.2352409362793, + "max_norm/layer19": 38.779598236083984, + "max_norm/layer2": 26.836795806884766, + "max_norm/layer20": 38.50577163696289, + "max_norm/layer21": 38.87571334838867, + "max_norm/layer22": 39.42427062988281, + "max_norm/layer23": 37.21847915649414, + "max_norm/layer3": 34.34575271606445, + "max_norm/layer4": 34.4432258605957, + "max_norm/layer5": 44.077754974365234, + "max_norm/layer6": 28.6057071685791, + "max_norm/layer7": 37.91745376586914, + "max_norm/layer8": 36.69032287597656, + "max_norm/layer9": 37.08796691894531, + "mean_norm": 11.799732064207396, + "mean_norm/layer0": 11.755437850952148, + "mean_norm/layer1": 11.22901839017868, + "mean_norm/layer10": 11.532833635807037, + "mean_norm/layer11": 11.962444841861725, + "mean_norm/layer12": 12.79077160358429, + "mean_norm/layer13": 11.57960969209671, + "mean_norm/layer14": 12.059264957904816, + "mean_norm/layer15": 12.540440499782562, + "mean_norm/layer16": 11.641206741333008, + "mean_norm/layer17": 12.231300234794617, + "mean_norm/layer18": 11.600049555301666, + "mean_norm/layer19": 11.686796128749847, + "mean_norm/layer2": 9.256644666194916, + "mean_norm/layer20": 11.78922188282013, + "mean_norm/layer21": 11.759462356567383, + "mean_norm/layer22": 13.063357532024384, + "mean_norm/layer23": 13.022553265094757, + "mean_norm/layer3": 12.574194192886353, + "mean_norm/layer4": 10.863756775856018, + "mean_norm/layer5": 14.197384178638458, + "mean_norm/layer6": 10.185243308544159, + "mean_norm/layer7": 10.893572747707367, + "mean_norm/layer8": 11.53871750831604, + "mean_norm/layer9": 11.440286993980408, + "multicode_k": 8, + "output_norm": 0.0, + "output_norm/layer0": 0.0, + "output_norm/layer1": 0.0, + "output_norm/layer10": 0.0, + "output_norm/layer11": 0.0, + "output_norm/layer12": 0.0, + "output_norm/layer13": 0.0, + "output_norm/layer14": 0.0, + "output_norm/layer15": 0.0, + "output_norm/layer16": 0.0, + "output_norm/layer17": 0.0, + "output_norm/layer18": 0.0, + "output_norm/layer19": 0.0, + "output_norm/layer2": 0.0, + "output_norm/layer20": 0.0, + "output_norm/layer21": 0.0, + "output_norm/layer22": 0.0, + "output_norm/layer23": 0.0, + "output_norm/layer3": 0.0, + "output_norm/layer4": 0.0, + "output_norm/layer5": 0.0, + "output_norm/layer6": 0.0, + "output_norm/layer7": 0.0, + "output_norm/layer8": 0.0, + "output_norm/layer9": 0.0, + "step": 15000, + "total_flos": 1.5651549796420813e+18, + "train_loss": 2.685329116312663, + "train_runtime": 43939.9354, + "train_samples_per_second": 16.386, + "train_steps_per_second": 0.341 + } + ], + "max_steps": 15000, + "num_train_epochs": 7, + "total_flos": 1.5651549796420813e+18, + "trial_name": null, + "trial_params": null +}