juancopi81 committed on
Commit
566e989
1 Parent(s): f857640

End of training

Browse files
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "epoch": 1.03,
3
- "eval_loss": 0.1700439453125,
4
- "eval_runtime": 3035.8435,
5
- "eval_samples_per_second": 5.112,
6
- "eval_steps_per_second": 0.16,
7
- "eval_wer": 5.696169637752716,
8
- "train_loss": 0.0865213623046875,
9
- "train_runtime": 8011.6489,
10
- "train_samples_per_second": 3.994,
11
- "train_steps_per_second": 0.062
12
  }
 
1
  {
2
+ "epoch": 1.0,
3
+ "eval_loss": 0.2337646484375,
4
+ "eval_runtime": 1889.9466,
5
+ "eval_samples_per_second": 8.212,
6
+ "eval_steps_per_second": 0.257,
7
+ "eval_wer": 95.61808118081181,
8
+ "train_loss": 0.1674322509765625,
9
+ "train_runtime": 2968.1959,
10
+ "train_samples_per_second": 2.156,
11
+ "train_steps_per_second": 0.034
12
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 1.03,
3
- "eval_loss": 0.1700439453125,
4
- "eval_runtime": 3035.8435,
5
- "eval_samples_per_second": 5.112,
6
- "eval_steps_per_second": 0.16,
7
- "eval_wer": 5.696169637752716
8
  }
 
1
  {
2
+ "epoch": 1.0,
3
+ "eval_loss": 0.2337646484375,
4
+ "eval_runtime": 1889.9466,
5
+ "eval_samples_per_second": 8.212,
6
+ "eval_steps_per_second": 0.257,
7
+ "eval_wer": 95.61808118081181
8
  }
runs/Dec16_21-53-30_132-145-140-45/events.out.tfevents.1671232633.132-145-140-45.989061.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:380604b58743c271b181672a813088baca9c93bea5d078b2f276597a3aa71fa1
3
+ size 352
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 1.03,
3
- "train_loss": 0.0865213623046875,
4
- "train_runtime": 8011.6489,
5
- "train_samples_per_second": 3.994,
6
- "train_steps_per_second": 0.062
7
  }
 
1
  {
2
+ "epoch": 1.0,
3
+ "train_loss": 0.1674322509765625,
4
+ "train_runtime": 2968.1959,
5
+ "train_samples_per_second": 2.156,
6
+ "train_steps_per_second": 0.034
7
  }
trainer_state.json CHANGED
@@ -1,154 +1,58 @@
1
  {
2
- "best_metric": 5.696169637752716,
3
- "best_model_checkpoint": "./checkpoint-500",
4
- "epoch": 1.03,
5
- "global_step": 500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 0.05,
12
- "learning_rate": 3.4043195900439816e-07,
13
- "loss": 0.0907,
14
  "step": 25
15
  },
16
  {
17
- "epoch": 0.1,
18
- "learning_rate": 4.203103093438967e-07,
19
- "loss": 0.0802,
20
  "step": 50
21
  },
22
  {
23
- "epoch": 0.15,
24
- "learning_rate": 4.6583071503011386e-07,
25
- "loss": 0.0774,
26
  "step": 75
27
  },
28
  {
29
- "epoch": 0.2,
30
- "learning_rate": 4.978065189231237e-07,
31
- "loss": 0.0746,
32
  "step": 100
33
  },
34
  {
35
- "epoch": 0.25,
36
- "learning_rate": 5e-07,
37
- "loss": 0.0834,
38
- "step": 125
39
- },
40
- {
41
- "epoch": 0.3,
42
- "learning_rate": 5e-07,
43
- "loss": 0.0775,
44
- "step": 150
45
- },
46
- {
47
- "epoch": 0.35,
48
- "learning_rate": 5e-07,
49
- "loss": 0.0784,
50
- "step": 175
51
- },
52
- {
53
- "epoch": 0.4,
54
- "learning_rate": 5e-07,
55
- "loss": 0.0756,
56
- "step": 200
57
- },
58
- {
59
- "epoch": 0.45,
60
- "learning_rate": 5e-07,
61
- "loss": 0.0744,
62
- "step": 225
63
- },
64
- {
65
- "epoch": 0.5,
66
- "learning_rate": 5e-07,
67
- "loss": 0.0801,
68
- "step": 250
69
- },
70
- {
71
- "epoch": 0.55,
72
- "learning_rate": 5e-07,
73
- "loss": 0.0768,
74
- "step": 275
75
- },
76
- {
77
- "epoch": 0.6,
78
- "learning_rate": 5e-07,
79
- "loss": 0.0795,
80
- "step": 300
81
- },
82
- {
83
- "epoch": 0.65,
84
- "learning_rate": 5e-07,
85
- "loss": 0.0837,
86
- "step": 325
87
- },
88
- {
89
- "epoch": 0.7,
90
- "learning_rate": 5e-07,
91
- "loss": 0.0827,
92
- "step": 350
93
- },
94
- {
95
- "epoch": 0.75,
96
- "learning_rate": 5e-07,
97
- "loss": 0.0858,
98
- "step": 375
99
- },
100
- {
101
- "epoch": 0.8,
102
- "learning_rate": 5e-07,
103
- "loss": 0.088,
104
- "step": 400
105
- },
106
- {
107
- "epoch": 0.85,
108
- "learning_rate": 5e-07,
109
- "loss": 0.0865,
110
- "step": 425
111
- },
112
- {
113
- "epoch": 0.9,
114
- "learning_rate": 5e-07,
115
- "loss": 0.0911,
116
- "step": 450
117
- },
118
- {
119
- "epoch": 0.95,
120
- "learning_rate": 5e-07,
121
- "loss": 0.0976,
122
- "step": 475
123
- },
124
- {
125
- "epoch": 1.03,
126
- "learning_rate": 5e-07,
127
- "loss": 0.1665,
128
- "step": 500
129
- },
130
- {
131
- "epoch": 1.03,
132
- "eval_loss": 0.1700439453125,
133
- "eval_runtime": 3050.6887,
134
- "eval_samples_per_second": 5.087,
135
- "eval_steps_per_second": 0.159,
136
- "eval_wer": 5.696169637752716,
137
- "step": 500
138
  },
139
  {
140
- "epoch": 1.03,
141
- "step": 500,
142
- "total_flos": 3.2659357379539763e+19,
143
- "train_loss": 0.0865213623046875,
144
- "train_runtime": 8011.6489,
145
- "train_samples_per_second": 3.994,
146
- "train_steps_per_second": 0.062
147
  }
148
  ],
149
- "max_steps": 500,
150
  "num_train_epochs": 9223372036854775807,
151
- "total_flos": 3.2659357379539763e+19,
152
  "trial_name": null,
153
  "trial_params": null
154
  }
 
1
  {
2
+ "best_metric": 95.61808118081181,
3
+ "best_model_checkpoint": "./checkpoint-100",
4
+ "epoch": 1.0,
5
+ "global_step": 100,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
+ "epoch": 0.25,
12
+ "learning_rate": 3e-05,
13
+ "loss": 0.2442,
14
  "step": 25
15
  },
16
  {
17
+ "epoch": 0.5,
18
+ "learning_rate": 3e-05,
19
+ "loss": 0.1382,
20
  "step": 50
21
  },
22
  {
23
+ "epoch": 0.75,
24
+ "learning_rate": 3e-05,
25
+ "loss": 0.1442,
26
  "step": 75
27
  },
28
  {
29
+ "epoch": 1.0,
30
+ "learning_rate": 3e-05,
31
+ "loss": 0.1432,
32
  "step": 100
33
  },
34
  {
35
+ "epoch": 1.0,
36
+ "eval_loss": 0.2337646484375,
37
+ "eval_runtime": 1865.6333,
38
+ "eval_samples_per_second": 8.319,
39
+ "eval_steps_per_second": 0.26,
40
+ "eval_wer": 95.61808118081181,
41
+ "step": 100
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
42
  },
43
  {
44
+ "epoch": 1.0,
45
+ "step": 100,
46
+ "total_flos": 6.531871475907953e+18,
47
+ "train_loss": 0.1674322509765625,
48
+ "train_runtime": 2968.1959,
49
+ "train_samples_per_second": 2.156,
50
+ "train_steps_per_second": 0.034
51
  }
52
  ],
53
+ "max_steps": 100,
54
  "num_train_epochs": 9223372036854775807,
55
+ "total_flos": 6.531871475907953e+18,
56
  "trial_name": null,
57
  "trial_params": null
58
  }