kapilkd13 committed on
Commit
f08c82a
1 Parent(s): c7ff3d3

End of training

Browse files
Files changed (4) hide show
  1. all_results.json +14 -0
  2. eval_results.json +9 -0
  3. train_results.json +8 -0
  4. trainer_state.json +127 -0
all_results.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 3.39,
3
+ "eval_loss": 0.7122135758399963,
4
+ "eval_runtime": 94.1287,
5
+ "eval_samples": 2095,
6
+ "eval_samples_per_second": 22.257,
7
+ "eval_steps_per_second": 2.783,
8
+ "eval_wer": 1.010687605649163,
9
+ "train_loss": 2.1192366943359375,
10
+ "train_runtime": 2559.907,
11
+ "train_samples": 4711,
12
+ "train_samples_per_second": 6.25,
13
+ "train_steps_per_second": 0.391
14
+ }
eval_results.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 3.39,
3
+ "eval_loss": 0.7122135758399963,
4
+ "eval_runtime": 94.1287,
5
+ "eval_samples": 2095,
6
+ "eval_samples_per_second": 22.257,
7
+ "eval_steps_per_second": 2.783,
8
+ "eval_wer": 1.010687605649163
9
+ }
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 3.39,
3
+ "train_loss": 2.1192366943359375,
4
+ "train_runtime": 2559.907,
5
+ "train_samples": 4711,
6
+ "train_samples_per_second": 6.25,
7
+ "train_steps_per_second": 0.391
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,127 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 3.389830508474576,
5
+ "global_step": 1000,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.34,
12
+ "eval_loss": 4.261892318725586,
13
+ "eval_runtime": 94.2977,
14
+ "eval_samples_per_second": 22.217,
15
+ "eval_steps_per_second": 2.778,
16
+ "eval_wer": 0.9999454713997492,
17
+ "step": 100
18
+ },
19
+ {
20
+ "epoch": 0.68,
21
+ "eval_loss": 3.344686508178711,
22
+ "eval_runtime": 94.5451,
23
+ "eval_samples_per_second": 22.159,
24
+ "eval_steps_per_second": 2.771,
25
+ "eval_wer": 1.0,
26
+ "step": 200
27
+ },
28
+ {
29
+ "epoch": 1.02,
30
+ "eval_loss": 2.064770221710205,
31
+ "eval_runtime": 92.8264,
32
+ "eval_samples_per_second": 22.569,
33
+ "eval_steps_per_second": 2.822,
34
+ "eval_wer": 1.0030536016140466,
35
+ "step": 300
36
+ },
37
+ {
38
+ "epoch": 1.36,
39
+ "eval_loss": 1.2480711936950684,
40
+ "eval_runtime": 92.4166,
41
+ "eval_samples_per_second": 22.669,
42
+ "eval_steps_per_second": 2.835,
43
+ "eval_wer": 1.0047439882218223,
44
+ "step": 400
45
+ },
46
+ {
47
+ "epoch": 1.69,
48
+ "learning_rate": 0.000188625,
49
+ "loss": 3.7472,
50
+ "step": 500
51
+ },
52
+ {
53
+ "epoch": 1.69,
54
+ "eval_loss": 1.077250361442566,
55
+ "eval_runtime": 92.9428,
56
+ "eval_samples_per_second": 22.541,
57
+ "eval_steps_per_second": 2.819,
58
+ "eval_wer": 1.011014777250668,
59
+ "step": 500
60
+ },
61
+ {
62
+ "epoch": 2.03,
63
+ "eval_loss": 0.9297690987586975,
64
+ "eval_runtime": 92.8184,
65
+ "eval_samples_per_second": 22.571,
66
+ "eval_steps_per_second": 2.823,
67
+ "eval_wer": 1.0173946234800153,
68
+ "step": 600
69
+ },
70
+ {
71
+ "epoch": 2.37,
72
+ "eval_loss": 0.8263903856277466,
73
+ "eval_runtime": 92.5375,
74
+ "eval_samples_per_second": 22.639,
75
+ "eval_steps_per_second": 2.831,
76
+ "eval_wer": 1.0098151480451496,
77
+ "step": 700
78
+ },
79
+ {
80
+ "epoch": 2.71,
81
+ "eval_loss": 0.7596059441566467,
82
+ "eval_runtime": 92.5009,
83
+ "eval_samples_per_second": 22.648,
84
+ "eval_steps_per_second": 2.832,
85
+ "eval_wer": 1.007470418234364,
86
+ "step": 800
87
+ },
88
+ {
89
+ "epoch": 3.05,
90
+ "eval_loss": 0.7255838513374329,
91
+ "eval_runtime": 92.7616,
92
+ "eval_samples_per_second": 22.585,
93
+ "eval_steps_per_second": 2.824,
94
+ "eval_wer": 1.0065979606303506,
95
+ "step": 900
96
+ },
97
+ {
98
+ "epoch": 3.39,
99
+ "learning_rate": 1.1249999999999998e-06,
100
+ "loss": 0.4913,
101
+ "step": 1000
102
+ },
103
+ {
104
+ "epoch": 3.39,
105
+ "eval_loss": 0.7122135758399963,
106
+ "eval_runtime": 92.98,
107
+ "eval_samples_per_second": 22.532,
108
+ "eval_steps_per_second": 2.818,
109
+ "eval_wer": 1.010687605649163,
110
+ "step": 1000
111
+ },
112
+ {
113
+ "epoch": 3.39,
114
+ "step": 1000,
115
+ "total_flos": 2.0204530018974664e+18,
116
+ "train_loss": 2.1192366943359375,
117
+ "train_runtime": 2559.907,
118
+ "train_samples_per_second": 6.25,
119
+ "train_steps_per_second": 0.391
120
+ }
121
+ ],
122
+ "max_steps": 1000,
123
+ "num_train_epochs": 4,
124
+ "total_flos": 2.0204530018974664e+18,
125
+ "trial_name": null,
126
+ "trial_params": null
127
+ }