charsiu commited on
Commit
8059efa
1 Parent(s): 5d7ae46

Upload trainer_state.json

Browse files
Files changed (1) hide show
  1. trainer_state.json +151 -0
trainer_state.json ADDED
@@ -0,0 +1,151 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 0.5266468686454935,
5
+ "global_step": 4500,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.06,
12
+ "learning_rate": 0.00015,
13
+ "loss": 2.5393,
14
+ "step": 500
15
+ },
16
+ {
17
+ "epoch": 0.06,
18
+ "eval_loss": 0.4428945779800415,
19
+ "eval_phone_accuracy": 0.9003876271495096,
20
+ "eval_runtime": 16.8778,
21
+ "eval_samples_per_second": 11.85,
22
+ "eval_steps_per_second": 2.962,
23
+ "step": 500
24
+ },
25
+ {
26
+ "epoch": 0.12,
27
+ "learning_rate": 0.0003,
28
+ "loss": 0.4474,
29
+ "step": 1000
30
+ },
31
+ {
32
+ "epoch": 0.12,
33
+ "eval_loss": 0.2071739137172699,
34
+ "eval_phone_accuracy": 0.9347190787134594,
35
+ "eval_runtime": 15.9974,
36
+ "eval_samples_per_second": 12.502,
37
+ "eval_steps_per_second": 3.126,
38
+ "step": 1000
39
+ },
40
+ {
41
+ "epoch": 0.18,
42
+ "learning_rate": 0.00028011664899257687,
43
+ "loss": 0.3105,
44
+ "step": 1500
45
+ },
46
+ {
47
+ "epoch": 0.18,
48
+ "eval_loss": 0.174857959151268,
49
+ "eval_phone_accuracy": 0.94312200282699,
50
+ "eval_runtime": 16.5779,
51
+ "eval_samples_per_second": 12.064,
52
+ "eval_steps_per_second": 3.016,
53
+ "step": 1500
54
+ },
55
+ {
56
+ "epoch": 0.23,
57
+ "learning_rate": 0.0002602332979851537,
58
+ "loss": 0.2682,
59
+ "step": 2000
60
+ },
61
+ {
62
+ "epoch": 0.23,
63
+ "eval_loss": 0.16749557852745056,
64
+ "eval_phone_accuracy": 0.9447956502510471,
65
+ "eval_runtime": 15.1084,
66
+ "eval_samples_per_second": 13.238,
67
+ "eval_steps_per_second": 3.309,
68
+ "step": 2000
69
+ },
70
+ {
71
+ "epoch": 0.29,
72
+ "learning_rate": 0.0002403499469777306,
73
+ "loss": 0.2467,
74
+ "step": 2500
75
+ },
76
+ {
77
+ "epoch": 0.29,
78
+ "eval_loss": 0.15832921862602234,
79
+ "eval_phone_accuracy": 0.9478567774048926,
80
+ "eval_runtime": 14.9641,
81
+ "eval_samples_per_second": 13.365,
82
+ "eval_steps_per_second": 3.341,
83
+ "step": 2500
84
+ },
85
+ {
86
+ "epoch": 0.35,
87
+ "learning_rate": 0.00022046659597030753,
88
+ "loss": 0.2324,
89
+ "step": 3000
90
+ },
91
+ {
92
+ "epoch": 0.35,
93
+ "eval_loss": 0.14310674369335175,
94
+ "eval_phone_accuracy": 0.949885966509708,
95
+ "eval_runtime": 15.0339,
96
+ "eval_samples_per_second": 13.303,
97
+ "eval_steps_per_second": 3.326,
98
+ "step": 3000
99
+ },
100
+ {
101
+ "epoch": 0.41,
102
+ "learning_rate": 0.0002005832449628844,
103
+ "loss": 0.22,
104
+ "step": 3500
105
+ },
106
+ {
107
+ "epoch": 0.41,
108
+ "eval_loss": 0.13784204423427582,
109
+ "eval_phone_accuracy": 0.9521579645672364,
110
+ "eval_runtime": 16.1699,
111
+ "eval_samples_per_second": 12.369,
112
+ "eval_steps_per_second": 3.092,
113
+ "step": 3500
114
+ },
115
+ {
116
+ "epoch": 0.47,
117
+ "learning_rate": 0.0001806998939554613,
118
+ "loss": 0.2109,
119
+ "step": 4000
120
+ },
121
+ {
122
+ "epoch": 0.47,
123
+ "eval_loss": 0.1341935396194458,
124
+ "eval_phone_accuracy": 0.9543519168899642,
125
+ "eval_runtime": 15.6229,
126
+ "eval_samples_per_second": 12.802,
127
+ "eval_steps_per_second": 3.2,
128
+ "step": 4000
129
+ },
130
+ {
131
+ "epoch": 0.53,
132
+ "learning_rate": 0.00016081654294803816,
133
+ "loss": 0.2039,
134
+ "step": 4500
135
+ },
136
+ {
137
+ "epoch": 0.53,
138
+ "eval_loss": 0.13459673523902893,
139
+ "eval_phone_accuracy": 0.9526435824726623,
140
+ "eval_runtime": 15.5354,
141
+ "eval_samples_per_second": 12.874,
142
+ "eval_steps_per_second": 3.218,
143
+ "step": 4500
144
+ }
145
+ ],
146
+ "max_steps": 8544,
147
+ "num_train_epochs": 1,
148
+ "total_flos": 7.300030651149006e+19,
149
+ "trial_name": null,
150
+ "trial_params": null
151
+ }