|
{ |
|
"MSE": 0.0, |
|
"MSE/layer0": 0.0, |
|
"dead_code_fraction": 1.0, |
|
"dead_code_fraction/layer0": 1.0, |
|
"epoch": 10.43, |
|
"eval_MSE/layer0": 6073.8636798095695, |
|
"eval_accuracy": 0.5791389432485323, |
|
"eval_dead_code_fraction/layer0": 0.1981725, |
|
"eval_input_norm/layer0": 0.7182212994247673, |
|
"eval_loss": 1.6604058742523193, |
|
"eval_multicode_k": 1, |
|
"eval_output_norm/layer0": 76.78913438796998, |
|
"eval_runtime": 6.7146, |
|
"eval_samples": 100, |
|
"eval_samples_per_second": 14.893, |
|
"eval_steps_per_second": 0.298, |
|
"input_norm": 0.0, |
|
"input_norm/layer0": 0.0, |
|
"loss": 1.6774777018260956, |
|
"max_norm": 153.29054260253906, |
|
"max_norm/layer0": 153.29054260253906, |
|
"mean_norm": 75.17323780059814, |
|
"mean_norm/layer0": 75.17323780059814, |
|
"multicode_k": 1, |
|
"output_norm": 0.0, |
|
"output_norm/layer0": 0.0, |
|
"perplexity": 5.261445896555633, |
|
"runtime": 132212.7109, |
|
"samples_per_second": 72.61, |
|
"steps_per_second": 0.756, |
|
"train_samples": 920563 |
|
} |