Aditya3107 committed on
Commit
1fe3377
1 Parent(s): 3404dc7

End of training

Browse files
all_results.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 15.0,
3
+ "eval_loss": 0.4012770652770996,
4
+ "eval_runtime": 477.7855,
5
+ "eval_samples": 10859,
6
+ "eval_samples_per_second": 22.728,
7
+ "eval_steps_per_second": 0.356,
8
+ "eval_wer": 1.0929595993888983,
9
+ "train_loss": 1.7017262231735957,
10
+ "train_runtime": 141338.6512,
11
+ "train_samples": 16111,
12
+ "train_samples_per_second": 1.71,
13
+ "train_steps_per_second": 0.009
14
+ }
eval_results.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 15.0,
3
+ "eval_loss": 0.4012770652770996,
4
+ "eval_runtime": 477.7855,
5
+ "eval_samples": 10859,
6
+ "eval_samples_per_second": 22.728,
7
+ "eval_steps_per_second": 0.356,
8
+ "eval_wer": 1.0929595993888983
9
+ }
runs/Mar10_16-57-33_mlp14/events.out.tfevents.1710228527.mlp14.1591632.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:556d7b29d575850fad006148a9e43f09d274e5f355299bdea8ec76707d7b376e
3
+ size 406
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 15.0,
3
+ "train_loss": 1.7017262231735957,
4
+ "train_runtime": 141338.6512,
5
+ "train_samples": 16111,
6
+ "train_samples_per_second": 1.71,
7
+ "train_steps_per_second": 0.009
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,145 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 15.0,
5
+ "global_step": 1260,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 1.19,
12
+ "eval_loss": 4.574927806854248,
13
+ "eval_runtime": 492.4632,
14
+ "eval_samples_per_second": 22.05,
15
+ "eval_steps_per_second": 0.345,
16
+ "eval_wer": 1.0,
17
+ "step": 100
18
+ },
19
+ {
20
+ "epoch": 2.38,
21
+ "eval_loss": 3.2543928623199463,
22
+ "eval_runtime": 477.4917,
23
+ "eval_samples_per_second": 22.742,
24
+ "eval_steps_per_second": 0.356,
25
+ "eval_wer": 1.0,
26
+ "step": 200
27
+ },
28
+ {
29
+ "epoch": 3.57,
30
+ "eval_loss": 3.110656261444092,
31
+ "eval_runtime": 470.1018,
32
+ "eval_samples_per_second": 23.099,
33
+ "eval_steps_per_second": 0.362,
34
+ "eval_wer": 1.000137922254286,
35
+ "step": 300
36
+ },
37
+ {
38
+ "epoch": 4.76,
39
+ "eval_loss": 0.9151943922042847,
40
+ "eval_runtime": 469.7177,
41
+ "eval_samples_per_second": 23.118,
42
+ "eval_steps_per_second": 0.362,
43
+ "eval_wer": 1.017081140723137,
44
+ "step": 400
45
+ },
46
+ {
47
+ "epoch": 5.95,
48
+ "learning_rate": 0.0003,
49
+ "loss": 3.9561,
50
+ "step": 500
51
+ },
52
+ {
53
+ "epoch": 5.95,
54
+ "eval_loss": 0.6422096490859985,
55
+ "eval_runtime": 477.7033,
56
+ "eval_samples_per_second": 22.732,
57
+ "eval_steps_per_second": 0.356,
58
+ "eval_wer": 1.059041334238669,
59
+ "step": 500
60
+ },
61
+ {
62
+ "epoch": 7.14,
63
+ "eval_loss": 0.49003028869628906,
64
+ "eval_runtime": 424.1123,
65
+ "eval_samples_per_second": 25.604,
66
+ "eval_steps_per_second": 0.401,
67
+ "eval_wer": 1.0866682227126125,
68
+ "step": 600
69
+ },
70
+ {
71
+ "epoch": 8.33,
72
+ "eval_loss": 0.4251333475112915,
73
+ "eval_runtime": 495.8179,
74
+ "eval_samples_per_second": 21.901,
75
+ "eval_steps_per_second": 0.343,
76
+ "eval_wer": 1.095516465795281,
77
+ "step": 700
78
+ },
79
+ {
80
+ "epoch": 9.52,
81
+ "eval_loss": 0.4232262969017029,
82
+ "eval_runtime": 527.1122,
83
+ "eval_samples_per_second": 20.601,
84
+ "eval_steps_per_second": 0.323,
85
+ "eval_wer": 1.1464522152435919,
86
+ "step": 800
87
+ },
88
+ {
89
+ "epoch": 10.71,
90
+ "eval_loss": 0.4133465588092804,
91
+ "eval_runtime": 479.4028,
92
+ "eval_samples_per_second": 22.651,
93
+ "eval_steps_per_second": 0.355,
94
+ "eval_wer": 1.1194300628076728,
95
+ "step": 900
96
+ },
97
+ {
98
+ "epoch": 11.9,
99
+ "learning_rate": 0.00010263157894736841,
100
+ "loss": 0.2637,
101
+ "step": 1000
102
+ },
103
+ {
104
+ "epoch": 11.9,
105
+ "eval_loss": 0.3940434157848358,
106
+ "eval_runtime": 489.7721,
107
+ "eval_samples_per_second": 22.172,
108
+ "eval_steps_per_second": 0.347,
109
+ "eval_wer": 1.13066542182991,
110
+ "step": 1000
111
+ },
112
+ {
113
+ "epoch": 13.1,
114
+ "eval_loss": 0.3943102955818176,
115
+ "eval_runtime": 478.1637,
116
+ "eval_samples_per_second": 22.71,
117
+ "eval_steps_per_second": 0.356,
118
+ "eval_wer": 1.0963758275335258,
119
+ "step": 1100
120
+ },
121
+ {
122
+ "epoch": 14.29,
123
+ "eval_loss": 0.3974030613899231,
124
+ "eval_runtime": 476.6101,
125
+ "eval_samples_per_second": 22.784,
126
+ "eval_steps_per_second": 0.357,
127
+ "eval_wer": 1.0893630113732813,
128
+ "step": 1200
129
+ },
130
+ {
131
+ "epoch": 15.0,
132
+ "step": 1260,
133
+ "total_flos": 2.676196803813189e+19,
134
+ "train_loss": 1.7017262231735957,
135
+ "train_runtime": 141338.6512,
136
+ "train_samples_per_second": 1.71,
137
+ "train_steps_per_second": 0.009
138
+ }
139
+ ],
140
+ "max_steps": 1260,
141
+ "num_train_epochs": 15,
142
+ "total_flos": 2.676196803813189e+19,
143
+ "trial_name": null,
144
+ "trial_params": null
145
+ }