TokFSM_k1_codebook_model / train_results.json
taufeeque's picture
Add model
d2a7b67
{
"MSE": 0.0,
"MSE/layer0": 0.0,
"MSE/layer1": 0.0,
"MSE/layer2": 0.0,
"MSE/layer3": 0.0,
"dead_code_fraction": 1.0,
"dead_code_fraction/layer0": 1.0,
"dead_code_fraction/layer1": 1.0,
"dead_code_fraction/layer2": 1.0,
"dead_code_fraction/layer3": 1.0,
"epoch": 1.0,
"input_norm": 0.0,
"input_norm/layer0": 0.0,
"input_norm/layer1": 0.0,
"input_norm/layer2": 0.0,
"input_norm/layer3": 0.0,
"loss": 1.313426919734478,
"max_norm": 46.33829879760742,
"max_norm/layer0": 17.856664657592773,
"max_norm/layer1": 20.084186553955078,
"max_norm/layer2": 33.940242767333984,
"max_norm/layer3": 46.33829879760742,
"mean_norm": 8.291451185941696,
"mean_norm/layer0": 8.462452054023743,
"mean_norm/layer1": 8.18280303478241,
"mean_norm/layer2": 8.143204748630524,
"mean_norm/layer3": 8.377344906330109,
"multicode_k": 1,
"output_norm": 0.0,
"output_norm/layer0": 0.0,
"output_norm/layer1": 0.0,
"output_norm/layer2": 0.0,
"output_norm/layer3": 0.0,
"runtime": 19944.2896,
"samples_per_second": 1026.86,
"steps_per_second": 1.003
}