File size: 2,261 Bytes
d2a7b67
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
{
    "MSE": 0.0,
    "MSE/layer0": 0.0,
    "MSE/layer1": 0.0,
    "MSE/layer2": 0.0,
    "MSE/layer3": 0.0,
    "dead_code_fraction": 1.0,
    "dead_code_fraction/layer0": 1.0,
    "dead_code_fraction/layer1": 1.0,
    "dead_code_fraction/layer2": 1.0,
    "dead_code_fraction/layer3": 1.0,
    "epoch": 1.0,
    "eval_MSE/layer0": 220380.4595384912,
    "eval_MSE/layer1": 132.78432877894963,
    "eval_MSE/layer2": 365.9396393365076,
    "eval_MSE/layer3": 415.98040078389045,
    "eval_accuracy": 0.4525254617525837,
    "eval_dead_code_fraction/layer0": 0.99694,
    "eval_dead_code_fraction/layer1": 0.9535,
    "eval_dead_code_fraction/layer2": 0.93486,
    "eval_dead_code_fraction/layer3": 0.98186,
    "eval_first_transition_accuracy": 0.88,
    "eval_input_norm/layer0": 333.77172351868165,
    "eval_input_norm/layer1": 6.54500140022604,
    "eval_input_norm/layer2": 6.137018968109251,
    "eval_input_norm/layer3": 7.40972196774554,
    "eval_loss": 1.2691402435302734,
    "eval_multicode_k": 1,
    "eval_output_norm/layer0": 12.936006403074337,
    "eval_output_norm/layer1": 13.144865618203756,
    "eval_output_norm/layer2": 18.324818944643734,
    "eval_output_norm/layer3": 18.466466705456643,
    "eval_runtime": 40.0743,
    "eval_samples_per_second": 817.682,
    "eval_steps_per_second": 1.597,
    "eval_transition_accuracy": 0.5633870967741935,
    "input_norm": 0.0,
    "input_norm/layer0": 0.0,
    "input_norm/layer1": 0.0,
    "input_norm/layer2": 0.0,
    "input_norm/layer3": 0.0,
    "loss": 1.313426919734478,
    "max_norm": 46.33829879760742,
    "max_norm/layer0": 17.856664657592773,
    "max_norm/layer1": 20.084186553955078,
    "max_norm/layer2": 33.940242767333984,
    "max_norm/layer3": 46.33829879760742,
    "mean_norm": 8.291451185941696,
    "mean_norm/layer0": 8.462452054023743,
    "mean_norm/layer1": 8.18280303478241,
    "mean_norm/layer2": 8.143204748630524,
    "mean_norm/layer3": 8.377344906330109,
    "multicode_k": 1,
    "output_norm": 0.0,
    "output_norm/layer0": 0.0,
    "output_norm/layer1": 0.0,
    "output_norm/layer2": 0.0,
    "output_norm/layer3": 0.0,
    "perplexity": 3.5577924120078235,
    "runtime": 19944.2896,
    "samples_per_second": 1026.86,
    "steps_per_second": 1.003
}