shpotes commited on
Commit
1f68524
1 Parent(s): fa2a9d2

Training in progress, step 500

Browse files
all_results.json DELETED
@@ -1,14 +0,0 @@
1
- {
2
- "epoch": 500.0,
3
- "eval_loss": 0.6521313190460205,
4
- "eval_runtime": 134.0142,
5
- "eval_samples": 2609,
6
- "eval_samples_per_second": 19.468,
7
- "eval_steps_per_second": 0.246,
8
- "eval_wer": 0.40601336302895324,
9
- "train_loss": 0.11533763631184896,
10
- "train_runtime": 176050.2174,
11
- "train_samples": 5705,
12
- "train_samples_per_second": 16.203,
13
- "train_steps_per_second": 0.102
14
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
errs DELETED
The diff for this file is too large to render. See raw diff
 
eval_results.json DELETED
@@ -1,9 +0,0 @@
1
- {
2
- "epoch": 500.0,
3
- "eval_loss": 0.6521313190460205,
4
- "eval_runtime": 134.0142,
5
- "eval_samples": 2609,
6
- "eval_samples_per_second": 19.468,
7
- "eval_steps_per_second": 0.246,
8
- "eval_wer": 0.40601336302895324
9
- }
 
 
 
 
 
 
 
 
 
 
logs DELETED
@@ -1,320 +0,0 @@
1
- 01/26/2022 10:56:56 - WARNING - __main__ - Process rank: -1, device: cuda:0, n_gpu: 1distributed training: False, 16-bits training: True
2
- 01/26/2022 10:56:56 - INFO - __main__ - Training/evaluation parameters TrainingArguments(
3
- _n_gpu=1,
4
- adafactor=False,
5
- adam_beta1=0.9,
6
- adam_beta2=0.999,
7
- adam_epsilon=1e-08,
8
- bf16=False,
9
- bf16_full_eval=False,
10
- dataloader_drop_last=False,
11
- dataloader_num_workers=0,
12
- dataloader_pin_memory=True,
13
- ddp_bucket_cap_mb=None,
14
- ddp_find_unused_parameters=None,
15
- debug=[],
16
- deepspeed=None,
17
- disable_tqdm=False,
18
- do_eval=True,
19
- do_predict=False,
20
- do_train=True,
21
- eval_accumulation_steps=None,
22
- eval_steps=500,
23
- evaluation_strategy=IntervalStrategy.STEPS,
24
- fp16=True,
25
- fp16_backend=auto,
26
- fp16_full_eval=False,
27
- fp16_opt_level=O1,
28
- gradient_accumulation_steps=2,
29
- gradient_checkpointing=True,
30
- greater_is_better=None,
31
- group_by_length=True,
32
- half_precision_backend=auto,
33
- hub_model_id=None,
34
- hub_strategy=HubStrategy.EVERY_SAVE,
35
- hub_token=<HUB_TOKEN>,
36
- ignore_data_skip=False,
37
- label_names=None,
38
- label_smoothing_factor=0.0,
39
- learning_rate=0.0003,
40
- length_column_name=input_length,
41
- load_best_model_at_end=False,
42
- local_rank=-1,
43
- log_level=-1,
44
- log_level_replica=-1,
45
- log_on_each_node=True,
46
- logging_dir=./runs/Jan26_10-56-56_ganymede.eafit.edu.co,
47
- logging_first_step=False,
48
- logging_nan_inf_filter=True,
49
- logging_steps=100,
50
- logging_strategy=IntervalStrategy.STEPS,
51
- lr_scheduler_type=SchedulerType.COSINE,
52
- max_grad_norm=1.0,
53
- max_steps=-1,
54
- metric_for_best_model=None,
55
- mp_parameters=,
56
- no_cuda=False,
57
- num_train_epochs=500.0,
58
- optim=OptimizerNames.ADAMW_HF,
59
- output_dir=./,
60
- overwrite_output_dir=True,
61
- past_index=-1,
62
- per_device_eval_batch_size=80,
63
- per_device_train_batch_size=80,
64
- prediction_loss_only=False,
65
- push_to_hub=True,
66
- push_to_hub_model_id=None,
67
- push_to_hub_organization=None,
68
- push_to_hub_token=<PUSH_TO_HUB_TOKEN>,
69
- remove_unused_columns=True,
70
- report_to=['wandb'],
71
- resume_from_checkpoint=None,
72
- run_name=cosine+drop_proj+low_specaugment-300M,
73
- save_on_each_node=False,
74
- save_steps=500,
75
- save_strategy=IntervalStrategy.STEPS,
76
- save_total_limit=1,
77
- seed=42,
78
- sharded_ddp=[],
79
- skip_memory_metrics=True,
80
- tf32=None,
81
- tpu_metrics_debug=False,
82
- tpu_num_cores=None,
83
- use_legacy_prediction_loop=False,
84
- warmup_ratio=0.0,
85
- warmup_steps=500,
86
- weight_decay=0.0,
87
- xpu_backend=None,
88
- )
89
- 01/26/2022 10:57:00 - WARNING - datasets.builder - Reusing dataset common_voice (/home/sagrilaft/.cache/huggingface/datasets/mozilla-foundation___common_voice/et/7.0.0/33e08856cfa0d0665e837bcad73ffd920a0bc713ce8c5fffb55dbdf1c084d5ba)
90
- 01/26/2022 10:57:02 - WARNING - datasets.builder - Reusing dataset common_voice (/home/sagrilaft/.cache/huggingface/datasets/mozilla-foundation___common_voice/et/7.0.0/33e08856cfa0d0665e837bcad73ffd920a0bc713ce8c5fffb55dbdf1c084d5ba)
91
- 01/26/2022 10:57:02 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sagrilaft/.cache/huggingface/datasets/mozilla-foundation___common_voice/et/7.0.0/33e08856cfa0d0665e837bcad73ffd920a0bc713ce8c5fffb55dbdf1c084d5ba/cache-f4479ce33e07f5c7.arrow
92
- 01/26/2022 10:57:02 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sagrilaft/.cache/huggingface/datasets/mozilla-foundation___common_voice/et/7.0.0/33e08856cfa0d0665e837bcad73ffd920a0bc713ce8c5fffb55dbdf1c084d5ba/cache-105cefde64f772a9.arrow
93
- 01/26/2022 10:58:44 - WARNING - huggingface_hub.repository - /home/sagrilaft/Project/audio/xls-r-et/./ is already a clone of https://huggingface.co/shpotes/xls-r-et. Make sure you pull the latest changes with `repo.git_pull()`.
94
-
95
- {'loss': 4.5903, 'learning_rate': 0.00019800000000000002, 'epoch': 2.78}
96
- {'loss': 2.9083, 'learning_rate': 0.000398, 'epoch': 5.56}
97
- {'loss': 1.2823, 'learning_rate': 0.000598, 'epoch': 8.33}
98
- {'loss': 0.3962, 'learning_rate': 0.0007980000000000001, 'epoch': 11.11}
99
- {'loss': 0.3034, 'learning_rate': 0.000998, 'epoch': 13.89}
100
- {'eval_loss': 0.38567885756492615, 'eval_wer': 0.4354438434616608, 'eval_runtime': 133.1769, 'eval_samples_per_second': 19.59, 'eval_steps_per_second': 0.248, 'epoch': 13.89}
101
- {'loss': 0.2639, 'learning_rate': 0.0009999210371864342, 'epoch': 16.67}
102
- {'loss': 0.2354, 'learning_rate': 0.0009996809758056298, 'epoch': 19.44}
103
- {'loss': 0.2158, 'learning_rate': 0.000999279885163942, 'epoch': 22.22}
104
- {'loss': 0.2063, 'learning_rate': 0.000998717894518502, 'epoch': 25.0}
105
- {'loss': 0.1926, 'learning_rate': 0.000997995184978743, 'epoch': 27.78}
106
- {'eval_loss': 0.4142022132873535, 'eval_wer': 0.4174355711104041, 'eval_runtime': 135.7258, 'eval_samples_per_second': 19.223, 'eval_steps_per_second': 0.243, 'epoch': 27.78}
107
- {'loss': 0.1771, 'learning_rate': 0.0009971119894480345, 'epoch': 30.56}
108
- {'loss': 0.1709, 'learning_rate': 0.0009960685925486266, 'epoch': 33.33}
109
- {'loss': 0.1724, 'learning_rate': 0.0009948653305299256, 'epoch': 36.11}
110
- {'loss': 0.1632, 'learning_rate': 0.0009935025911601335, 'epoch': 38.89}
111
- {'loss': 0.1609, 'learning_rate': 0.0009919808136012837, 'epoch': 41.67}
112
- {'eval_loss': 0.4701250195503235, 'eval_wer': 0.42958956411072224, 'eval_runtime': 133.1213, 'eval_samples_per_second': 19.599, 'eval_steps_per_second': 0.248, 'epoch': 41.67}
113
- 01/26/2022 15:02:33 - WARNING - huggingface_hub.repository - Adding files tracked by Git LFS: ['wandb/run-20220126_105847-1xdiy2kf/run-1xdiy2kf.wandb']. This may take a bit of time if the files are large.
114
- {'loss': 0.1521, 'learning_rate': 0.0009903004882677155, 'epoch': 44.44}
115
- {'loss': 0.1531, 'learning_rate': 0.0009884621566680308, 'epoch': 47.22}
116
- {'loss': 0.1514, 'learning_rate': 0.0009864664112305846, 'epoch': 50.0}
117
- {'loss': 0.1468, 'learning_rate': 0.0009843138951125682, 'epoch': 52.78}
118
- {'loss': 0.1501, 'learning_rate': 0.000982005301992741, 'epoch': 55.56}
119
- {'eval_loss': 0.45478546619415283, 'eval_wer': 0.43805281578110083, 'eval_runtime': 133.376, 'eval_samples_per_second': 19.561, 'eval_steps_per_second': 0.247, 'epoch': 55.56}
120
- {'loss': 0.1427, 'learning_rate': 0.0009795413758478834, 'epoch': 58.33}
121
- {'loss': 0.1441, 'learning_rate': 0.0009769229107130409, 'epoch': 61.11}
122
- {'loss': 0.1399, 'learning_rate': 0.0009741507504256327, 'epoch': 63.89}
123
- {'loss': 0.1379, 'learning_rate': 0.0009712257883535152, 'epoch': 66.67}
124
- {'loss': 0.1382, 'learning_rate': 0.0009681489671070803, 'epoch': 69.44}
125
- {'eval_loss': 0.523300290107727, 'eval_wer': 0.4544066178810054, 'eval_runtime': 131.9566, 'eval_samples_per_second': 19.772, 'eval_steps_per_second': 0.25, 'epoch': 69.44}
126
- {'loss': 0.1372, 'learning_rate': 0.0009649212782354872, 'epoch': 72.22}
127
- {'loss': 0.1345, 'learning_rate': 0.0009615437619071199, 'epoch': 75.0}
128
- {'loss': 0.1346, 'learning_rate': 0.0009580175065743799, 'epoch': 77.78}
129
- {'loss': 0.1367, 'learning_rate': 0.0009543436486229162, 'epoch': 80.56}
130
- {'loss': 0.1287, 'learning_rate': 0.0009505233720054086, 'epoch': 83.33}
131
- {'eval_loss': 0.48360341787338257, 'eval_wer': 0.43658924594336623, 'eval_runtime': 132.2498, 'eval_samples_per_second': 19.728, 'eval_steps_per_second': 0.25, 'epoch': 83.33}
132
- {'loss': 0.1226, 'learning_rate': 0.0009465579078600233, 'epoch': 86.11}
133
- {'loss': 0.1258, 'learning_rate': 0.0009424485341136599, 'epoch': 88.89}
134
- {'loss': 0.1222, 'learning_rate': 0.0009381965750701229, 'epoch': 91.67}
135
- {'loss': 0.1182, 'learning_rate': 0.0009338034009833446, 'epoch': 94.44}
136
- {'loss': 0.1164, 'learning_rate': 0.0009292704276158022, 'epoch': 97.22}
137
- {'eval_loss': 0.5202445983886719, 'eval_wer': 0.43948456888323256, 'eval_runtime': 132.7793, 'eval_samples_per_second': 19.649, 'eval_steps_per_second': 0.249, 'epoch': 97.22}
138
- {'loss': 0.1212, 'learning_rate': 0.0009245991157822682, 'epoch': 100.0}
139
- {'loss': 0.1139, 'learning_rate': 0.000919790970879042, 'epoch': 102.78}
140
- {'loss': 0.115, 'learning_rate': 0.000914847542398815, 'epoch': 105.56}
141
- {'loss': 0.1123, 'learning_rate': 0.0009097704234313245, 'epoch': 108.33}
142
- {'loss': 0.1101, 'learning_rate': 0.0009045612501499573, 'epoch': 111.11}
143
- {'eval_loss': 0.5120447874069214, 'eval_wer': 0.43827553293032134, 'eval_runtime': 131.3001, 'eval_samples_per_second': 19.871, 'eval_steps_per_second': 0.251, 'epoch': 111.11}
144
- {'loss': 0.1092, 'learning_rate': 0.0008992217012844713, 'epoch': 113.89}
145
- {'loss': 0.1104, 'learning_rate': 0.0008937534975799996, 'epoch': 116.67}
146
- {'loss': 0.1021, 'learning_rate': 0.0008881584012425165, 'epoch': 119.44}
147
- {'loss': 0.1063, 'learning_rate': 0.0008824382153709421, 'epoch': 122.22}
148
- {'loss': 0.1107, 'learning_rate': 0.0008765947833760678, 'epoch': 125.0}
149
- {'eval_loss': 0.5130612850189209, 'eval_wer': 0.4446706967865097, 'eval_runtime': 133.0961, 'eval_samples_per_second': 19.602, 'eval_steps_per_second': 0.248, 'epoch': 125.0}
150
- {'loss': 0.1054, 'learning_rate': 0.000870629988386491, 'epoch': 127.78}
151
- {'loss': 0.1037, 'learning_rate': 0.0008645457526417502, 'epoch': 130.56}
152
- {'loss': 0.1, 'learning_rate': 0.0008583440368728572, 'epoch': 133.33}
153
- {'loss': 0.0967, 'learning_rate': 0.0008520268396704223, 'epoch': 136.11}
154
- {'loss': 0.0942, 'learning_rate': 0.0008455961968405809, 'epoch': 138.89}
155
- {'eval_loss': 0.5256752967834473, 'eval_wer': 0.43748011454024816, 'eval_runtime': 133.1352, 'eval_samples_per_second': 19.597, 'eval_steps_per_second': 0.248, 'epoch': 138.89}
156
- {'loss': 0.0987, 'learning_rate': 0.0008390541807489265, 'epoch': 141.67}
157
- {'loss': 0.094, 'learning_rate': 0.0008324028996526611, 'epoch': 144.44}
158
- {'loss': 0.0935, 'learning_rate': 0.0008256444970211793, 'epoch': 147.22}
159
- {'loss': 0.0906, 'learning_rate': 0.000818781150845306, 'epoch': 150.0}
160
- {'loss': 0.0909, 'learning_rate': 0.0008118150729354068, 'epoch': 152.78}
161
- {'eval_loss': 0.5312919020652771, 'eval_wer': 0.47133312122176263, 'eval_runtime': 133.5185, 'eval_samples_per_second': 19.54, 'eval_steps_per_second': 0.247, 'epoch': 152.78}
162
- {'loss': 0.0881, 'learning_rate': 0.0008047485082086017, 'epoch': 155.56}
163
- {'loss': 0.0921, 'learning_rate': 0.0007975837339653084, 'epoch': 158.33}
164
- {'loss': 0.0838, 'learning_rate': 0.0007903230591553503, 'epoch': 161.11}
165
- {'loss': 0.0775, 'learning_rate': 0.0007829688236338643, 'epoch': 163.89}
166
- {'loss': 0.0807, 'learning_rate': 0.0007755233974072504, 'epoch': 166.67}
167
- {'eval_loss': 0.5847254991531372, 'eval_wer': 0.44708876869233216, 'eval_runtime': 133.1812, 'eval_samples_per_second': 19.59, 'eval_steps_per_second': 0.248, 'epoch': 166.67}
168
- {'loss': 0.0801, 'learning_rate': 0.0007679891798694021, 'epoch': 169.44}
169
- {'loss': 0.0952, 'learning_rate': 0.000760368599028469, 'epoch': 172.22}
170
- {'loss': 0.0813, 'learning_rate': 0.0007526641107243966, 'epoch': 175.0}
171
- {'loss': 0.0795, 'learning_rate': 0.0007448781978374969, 'epoch': 177.78}
172
- {'loss': 0.0767, 'learning_rate': 0.0007370133694883051, 'epoch': 180.56}
173
- {'eval_loss': 0.5318175554275513, 'eval_wer': 0.4534521158129176, 'eval_runtime': 135.804, 'eval_samples_per_second': 19.212, 'eval_steps_per_second': 0.243, 'epoch': 180.56}
174
- {'loss': 0.0762, 'learning_rate': 0.0007290721602289801, 'epoch': 183.33}
175
- {'loss': 0.0729, 'learning_rate': 0.0007210571292265096, 'epoch': 186.11}
176
- {'loss': 0.0751, 'learning_rate': 0.0007129708594379816, 'epoch': 188.89}
177
- {'loss': 0.0743, 'learning_rate': 0.0007048159567781905, 'epoch': 191.67}
178
- {'loss': 0.0729, 'learning_rate': 0.0006965950492798443, 'epoch': 194.44}
179
- {'eval_loss': 0.5796982645988464, 'eval_wer': 0.4584155265669742, 'eval_runtime': 132.2018, 'eval_samples_per_second': 19.735, 'eval_steps_per_second': 0.25, 'epoch': 194.44}
180
- {'loss': 0.0791, 'learning_rate': 0.0006883107862466433, 'epoch': 197.22}
181
- {'loss': 0.0737, 'learning_rate': 0.0006799658373995054, 'epoch': 200.0}
182
- {'loss': 0.0694, 'learning_rate': 0.0006715628920162093, 'epoch': 202.78}
183
- {'loss': 0.0687, 'learning_rate': 0.0006631046580647384, 'epoch': 205.56}
184
- {'loss': 0.072, 'learning_rate': 0.0006545938613305993, 'epoch': 208.33}
185
- {'eval_loss': 0.5266388654708862, 'eval_wer': 0.44339802736239264, 'eval_runtime': 130.3709, 'eval_samples_per_second': 20.012, 'eval_steps_per_second': 0.253, 'epoch': 208.33}
186
- {'loss': 0.0647, 'learning_rate': 0.000646033244538398, 'epoch': 211.11}
187
- {'loss': 0.0631, 'learning_rate': 0.000637425566467959, 'epoch': 213.89}
188
- {'loss': 0.0606, 'learning_rate': 0.0006287736010652693, 'epoch': 216.67}
189
- {'loss': 0.0645, 'learning_rate': 0.000620080136548535, 'epoch': 219.44}
190
- {'loss': 0.0593, 'learning_rate': 0.0006113479745096386, 'epoch': 222.22}
191
- {'eval_loss': 0.579177737236023, 'eval_wer': 0.43888005090677695, 'eval_runtime': 133.0716, 'eval_samples_per_second': 19.606, 'eval_steps_per_second': 0.248, 'epoch': 222.22}
192
- {'loss': 0.0596, 'learning_rate': 0.0006025799290112865, 'epoch': 225.0}
193
- {'loss': 0.0606, 'learning_rate': 0.0005937788256801371, 'epoch': 227.78}
194
- {'loss': 0.0591, 'learning_rate': 0.0005849475007962031, 'epoch': 230.56}
195
- {'loss': 0.0544, 'learning_rate': 0.0005760888003788196, 'epoch': 233.33}
196
- {'loss': 0.0524, 'learning_rate': 0.0005672055792694753, 'epoch': 236.11}
197
- {'eval_loss': 0.5740395784378052, 'eval_wer': 0.43732103086223356, 'eval_runtime': 132.5642, 'eval_samples_per_second': 19.681, 'eval_steps_per_second': 0.249, 'epoch': 236.11}
198
- {'loss': 0.0504, 'learning_rate': 0.0005583007002117978, 'epoch': 238.89}
199
- {'loss': 0.0494, 'learning_rate': 0.0005493770329289953, 'epoch': 241.67}
200
- {'loss': 0.0484, 'learning_rate': 0.0005404374531990474, 'epoch': 244.44}
201
- {'loss': 0.0489, 'learning_rate': 0.0005314848419279442, 'epoch': 247.22}
202
- {'loss': 0.0494, 'learning_rate': 0.0005225220842212748, 'epoch': 250.0}
203
- {'eval_loss': 0.5520852208137512, 'eval_wer': 0.44358892777601017, 'eval_runtime': 133.6258, 'eval_samples_per_second': 19.525, 'eval_steps_per_second': 0.247, 'epoch': 250.0}
204
- {'loss': 0.0499, 'learning_rate': 0.0005135520684544602, 'epoch': 252.78}
205
- {'loss': 0.0487, 'learning_rate': 0.0005045776853419344, 'epoch': 255.56}
206
- {'loss': 0.0523, 'learning_rate': 0.0004956018270055703, 'epoch': 258.33}
207
- {'loss': 0.0479, 'learning_rate': 0.00048662738604265206, 'epoch': 261.11}
208
- {'loss': 0.0469, 'learning_rate': 0.0004776572545936954, 'epoch': 263.89}
209
- {'eval_loss': 0.5630596876144409, 'eval_wer': 0.4345847916003818, 'eval_runtime': 130.7272, 'eval_samples_per_second': 19.958, 'eval_steps_per_second': 0.252, 'epoch': 263.89}
210
- {'loss': 0.0467, 'learning_rate': 0.0004686943234104146, 'epoch': 266.67}
211
- {'loss': 0.0438, 'learning_rate': 0.00045974148092413597, 'epoch': 269.44}
212
- {'loss': 0.0422, 'learning_rate': 0.00045080161231496064, 'epoch': 272.22}
213
- {'loss': 0.042, 'learning_rate': 0.00044187759858197486, 'epoch': 275.0}
214
- {'loss': 0.0417, 'learning_rate': 0.0004329723156148063, 'epoch': 277.78}
215
- {'eval_loss': 0.5777372121810913, 'eval_wer': 0.43057588291441296, 'eval_runtime': 130.7332, 'eval_samples_per_second': 19.957, 'eval_steps_per_second': 0.252, 'epoch': 277.78}
216
- {'loss': 0.0406, 'learning_rate': 0.0004240886332668285, 'epoch': 280.56}
217
- {'loss': 0.0385, 'learning_rate': 0.00041522941443031025, 'epoch': 283.33}
218
- {'loss': 0.0384, 'learning_rate': 0.0004063975141138074, 'epoch': 286.11}
219
- {'loss': 0.0369, 'learning_rate': 0.00039759577852209704, 'epoch': 288.89}
220
- {'loss': 0.0379, 'learning_rate': 0.0003888270441389465, 'epoch': 291.67}
221
- {'eval_loss': 0.5934527516365051, 'eval_wer': 0.42828507795100224, 'eval_runtime': 131.6738, 'eval_samples_per_second': 19.814, 'eval_steps_per_second': 0.251, 'epoch': 291.67}
222
- {'loss': 0.0399, 'learning_rate': 0.0003800941368130171, 'epoch': 294.44}
223
- {'loss': 0.0359, 'learning_rate': 0.0003713998708471946, 'epoch': 297.22}
224
- {'loss': 0.0345, 'learning_rate': 0.0003627470480916394, 'epoch': 300.0}
225
- {'loss': 0.0346, 'learning_rate': 0.00035413845704085215, 'epoch': 302.78}
226
- {'loss': 0.0319, 'learning_rate': 0.00034557687193504045, 'epoch': 305.56}
227
- {'eval_loss': 0.5892442464828491, 'eval_wer': 0.41880369074132995, 'eval_runtime': 130.692, 'eval_samples_per_second': 19.963, 'eval_steps_per_second': 0.253, 'epoch': 305.56}
228
- {'loss': 0.0318, 'learning_rate': 0.00033706505186608136, 'epoch': 308.33}
229
- {'loss': 0.0301, 'learning_rate': 0.00032860573988836573, 'epoch': 311.11}
230
- {'loss': 0.0322, 'learning_rate': 0.0003202016621348088, 'epoch': 313.89}
231
- {'loss': 0.0331, 'learning_rate': 0.00031185552693831594, 'epoch': 316.67}
232
- {'loss': 0.0311, 'learning_rate': 0.0003035700239589846, 'epoch': 319.44}
233
- {'eval_loss': 0.6010639071464539, 'eval_wer': 0.4210626789691378, 'eval_runtime': 132.2371, 'eval_samples_per_second': 19.73, 'eval_steps_per_second': 0.25, 'epoch': 319.44}
234
- {'loss': 0.0291, 'learning_rate': 0.00029534782331732204, 'epoch': 322.22}
235
- {'loss': 0.0287, 'learning_rate': 0.00028719157473376303, 'epoch': 325.0}
236
- {'loss': 0.0279, 'learning_rate': 0.00027918443530500935, 'epoch': 327.78}
237
- {'loss': 0.0294, 'learning_rate': 0.0002711672294401907, 'epoch': 330.56}
238
- {'loss': 0.0269, 'learning_rate': 0.00026322376817181157, 'epoch': 333.33}
239
- {'eval_loss': 0.5972930192947388, 'eval_wer': 0.4232262169901368, 'eval_runtime': 133.0245, 'eval_samples_per_second': 19.613, 'eval_steps_per_second': 0.248, 'epoch': 333.33}
240
- {'loss': 0.0251, 'learning_rate': 0.0002553566113926006, 'epoch': 336.11}
241
- {'loss': 0.0261, 'learning_rate': 0.00024756829440508705, 'epoch': 338.89}
242
- {'loss': 0.025, 'learning_rate': 0.0002398613271045611, 'epoch': 341.67}
243
- {'loss': 0.0264, 'learning_rate': 0.00023223819317022654, 'epoch': 344.44}
244
- {'loss': 0.0271, 'learning_rate': 0.00022470134926479935, 'epoch': 347.22}
245
- {'eval_loss': 0.6094068288803101, 'eval_wer': 0.4428253261215399, 'eval_runtime': 132.9769, 'eval_samples_per_second': 19.62, 'eval_steps_per_second': 0.248, 'epoch': 347.22}
246
- {'loss': 0.0246, 'learning_rate': 0.00021725322424281286, 'epoch': 350.0}
247
- {'loss': 0.0245, 'learning_rate': 0.00020989621836788614, 'epoch': 352.78}
248
- {'loss': 0.0229, 'learning_rate': 0.00020263270253920428, 'epoch': 355.56}
249
- {'loss': 0.0229, 'learning_rate': 0.00019546501752746288, 'epoch': 358.33}
250
- {'loss': 0.0236, 'learning_rate': 0.0001883954732205217, 'epoch': 361.11}
251
- {'eval_loss': 0.611167311668396, 'eval_wer': 0.42373528475978367, 'eval_runtime': 132.3797, 'eval_samples_per_second': 19.708, 'eval_steps_per_second': 0.249, 'epoch': 361.11}
252
- {'loss': 0.0229, 'learning_rate': 0.00018142634787900996, 'epoch': 363.89}
253
- {'loss': 0.0221, 'learning_rate': 0.00017455988740212576, 'epoch': 366.67}
254
- {'loss': 0.0208, 'learning_rate': 0.0001677983046038624, 'epoch': 369.44}
255
- {'loss': 0.0208, 'learning_rate': 0.00016114377849989813, 'epoch': 372.22}
256
- {'loss': 0.0202, 'learning_rate': 0.00015459845360537756, 'epoch': 375.0}
257
- {'eval_loss': 0.605171799659729, 'eval_wer': 0.4233534839325485, 'eval_runtime': 132.1498, 'eval_samples_per_second': 19.743, 'eval_steps_per_second': 0.25, 'epoch': 375.0}
258
- {'loss': 0.0197, 'learning_rate': 0.0001481644392438113, 'epoch': 377.78}
259
- {'loss': 0.0195, 'learning_rate': 0.00014184380886731607, 'epoch': 380.56}
260
- {'loss': 0.0186, 'learning_rate': 0.0001356385993884165, 'epoch': 383.33}
261
- {'loss': 0.0186, 'learning_rate': 0.00012955081052362072, 'epoch': 386.11}
262
- {'loss': 0.0175, 'learning_rate': 0.00012358240414898276, 'epoch': 388.89}
263
- {'eval_loss': 0.631072998046875, 'eval_wer': 0.4188673242125358, 'eval_runtime': 131.5592, 'eval_samples_per_second': 19.831, 'eval_steps_per_second': 0.251, 'epoch': 388.89}
264
- {'loss': 0.0164, 'learning_rate': 0.00011773530366786184, 'epoch': 391.67}
265
- {'loss': 0.0166, 'learning_rate': 0.0001120113933910767, 'epoch': 394.44}
266
- {'loss': 0.0163, 'learning_rate': 0.000106412517929661, 'epoch': 397.22}
267
- {'loss': 0.0159, 'learning_rate': 0.00010094048160041091, 'epoch': 400.0}
268
- {'loss': 0.0158, 'learning_rate': 9.559704784441814e-05, 'epoch': 402.78}
269
- {'eval_loss': 0.618556797504425, 'eval_wer': 0.4137130130448616, 'eval_runtime': 132.4333, 'eval_samples_per_second': 19.7, 'eval_steps_per_second': 0.249, 'epoch': 402.78}
270
- {'loss': 0.015, 'learning_rate': 9.038393865877726e-05, 'epoch': 405.56}
271
- {'loss': 0.0156, 'learning_rate': 8.530283404164612e-05, 'epoch': 408.33}
272
- {'loss': 0.0146, 'learning_rate': 8.03553714508441e-05, 'epoch': 411.11}
273
- {'loss': 0.0146, 'learning_rate': 7.554314527615763e-05, 'epoch': 413.89}
274
- {'loss': 0.0141, 'learning_rate': 7.086770632552514e-05, 'epoch': 416.67}
275
- {'eval_loss': 0.6352781057357788, 'eval_wer': 0.412249443207127, 'eval_runtime': 132.6132, 'eval_samples_per_second': 19.674, 'eval_steps_per_second': 0.249, 'epoch': 416.67}
276
- {'loss': 0.0138, 'learning_rate': 6.633056132526849e-05, 'epoch': 419.44}
277
- {'loss': 0.0138, 'learning_rate': 6.193317243452734e-05, 'epoch': 422.22}
278
- {'loss': 0.0131, 'learning_rate': 5.7676956774059205e-05, 'epoch': 425.0}
279
- {'loss': 0.0131, 'learning_rate': 5.356328596955179e-05, 'epoch': 427.78}
280
- {'loss': 0.013, 'learning_rate': 4.963246731369253e-05, 'epoch': 430.56}
281
- {'eval_loss': 0.6343812942504883, 'eval_wer': 0.40687241489023224, 'eval_runtime': 131.5808, 'eval_samples_per_second': 19.828, 'eval_steps_per_second': 0.251, 'epoch': 430.56}
282
- {'loss': 0.0127, 'learning_rate': 4.580635924447718e-05, 'epoch': 433.33}
283
- {'loss': 0.0126, 'learning_rate': 4.212662149914887e-05, 'epoch': 436.11}
284
- {'loss': 0.0125, 'learning_rate': 3.859443992523443e-05, 'epoch': 438.89}
285
- {'loss': 0.0127, 'learning_rate': 3.521095281819786e-05, 'epoch': 441.67}
286
- {'loss': 0.0117, 'learning_rate': 3.1977250554608205e-05, 'epoch': 444.44}
287
- {'eval_loss': 0.6442536115646362, 'eval_wer': 0.40801781737193765, 'eval_runtime': 132.782, 'eval_samples_per_second': 19.649, 'eval_steps_per_second': 0.249, 'epoch': 444.44}
288
- {'loss': 0.0122, 'learning_rate': 2.8894375240750613e-05, 'epoch': 447.22}
289
- {'loss': 0.0127, 'learning_rate': 2.5963320376792666e-05, 'epoch': 450.0}
290
- {'loss': 0.0125, 'learning_rate': 2.318503053661475e-05, 'epoch': 452.78}
291
- {'loss': 0.0121, 'learning_rate': 2.056040106340823e-05, 'epoch': 455.56}
292
- {'loss': 0.0122, 'learning_rate': 1.809027778113803e-05, 'epoch': 458.33}
293
- {'eval_loss': 0.6512282490730286, 'eval_wer': 0.4069360483614381, 'eval_runtime': 133.1307, 'eval_samples_per_second': 19.597, 'eval_steps_per_second': 0.248, 'epoch': 458.33}
294
- {'loss': 0.0113, 'learning_rate': 1.5775456721964065e-05, 'epoch': 461.11}
295
- {'loss': 0.0113, 'learning_rate': 1.3616683869708658e-05, 'epoch': 463.89}
296
- {'loss': 0.0117, 'learning_rate': 1.1614654919452406e-05, 'epoch': 466.67}
297
- {'loss': 0.0112, 'learning_rate': 9.770015053337078e-06, 'epoch': 469.44}
298
- {'loss': 0.0115, 'learning_rate': 8.083358732646206e-06, 'epoch': 472.22}
299
- {'eval_loss': 0.6556624174118042, 'eval_wer': 0.4069360483614381, 'eval_runtime': 132.4623, 'eval_samples_per_second': 19.696, 'eval_steps_per_second': 0.249, 'epoch': 472.22}
300
- {'loss': 0.0111, 'learning_rate': 6.555229506231608e-06, 'epoch': 475.0}
301
- {'loss': 0.0118, 'learning_rate': 5.186119835347169e-06, 'epoch': 477.78}
302
- {'loss': 0.0112, 'learning_rate': 3.976470934946075e-06, 'epoch': 480.56}
303
- {'loss': 0.0117, 'learning_rate': 2.92667263149321e-06, 'epoch': 483.33}
304
- {'loss': 0.0111, 'learning_rate': 2.037063237338044e-06, 'epoch': 486.11}
305
- {'eval_loss': 0.6513079404830933, 'eval_wer': 0.4059497295577474, 'eval_runtime': 131.4726, 'eval_samples_per_second': 19.844, 'eval_steps_per_second': 0.251, 'epoch': 486.11}
306
- {'loss': 0.0109, 'learning_rate': 1.3144256109794418e-06, 'epoch': 488.89}
307
- {'loss': 0.0112, 'learning_rate': 7.44394288673067e-07, 'epoch': 491.67}
308
- {'loss': 0.0113, 'learning_rate': 3.352551457218578e-07, 'epoch': 494.44}
309
- {'loss': 0.011, 'learning_rate': 8.714003300058781e-08, 'epoch': 497.22}
310
- {'loss': 0.0113, 'learning_rate': 1.2890911316176812e-10, 'epoch': 500.0}
311
- {'eval_loss': 0.6521313190460205, 'eval_wer': 0.40601336302895324, 'eval_runtime': 132.4384, 'eval_samples_per_second': 19.7, 'eval_steps_per_second': 0.249, 'epoch': 500.0}
312
- {'train_runtime': 176050.2174, 'train_samples_per_second': 16.203, 'train_steps_per_second': 0.102, 'train_loss': 0.11533763631184896, 'epoch': 500.0}
313
- ***** train metrics *****
314
- epoch = 500.0
315
- train_loss = 0.1153
316
- train_runtime = 2 days, 0:54:10.21
317
- train_samples = 5705
318
- train_samples_per_second = 16.203
319
- train_steps_per_second = 0.102
320
- 01/28/2022 11:53:03 - INFO - __main__ - *** Evaluate ***
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a841c1d52b5543205b5280dafe76d3b79f4a8e662faf5145a8f24b4ff311b969
3
  size 1262083569
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f0265c3190d4bad709792f032d753570867b48b4491c9f120d58b7516631525
3
  size 1262083569
run-300M.sh CHANGED
@@ -9,7 +9,7 @@ python src/run_speech_recognition_ctc_bnb.py \
9
  --dataset_config_name="et" \
10
  --output_dir="./" \
11
  --overwrite_output_dir \
12
- --num_train_epochs=500 \
13
  --per_device_train_batch_size=80 \
14
  --per_device_eval_batch_size=80 \
15
  --gradient_accumulation_steps=2 \
 
9
  --dataset_config_name="et" \
10
  --output_dir="./" \
11
  --overwrite_output_dir \
12
+ --num_train_epochs=100 \
13
  --per_device_train_batch_size=80 \
14
  --per_device_eval_batch_size=80 \
15
  --gradient_accumulation_steps=2 \
train_results.json DELETED
@@ -1,8 +0,0 @@
1
- {
2
- "epoch": 500.0,
3
- "train_loss": 0.11533763631184896,
4
- "train_runtime": 176050.2174,
5
- "train_samples": 5705,
6
- "train_samples_per_second": 16.203,
7
- "train_steps_per_second": 0.102
8
- }
 
 
 
 
 
 
 
 
 
trainer_state.json DELETED
@@ -1,1429 +0,0 @@
1
- {
2
- "best_metric": null,
3
- "best_model_checkpoint": null,
4
- "epoch": 500.0,
5
- "global_step": 18000,
6
- "is_hyper_param_search": false,
7
- "is_local_process_zero": true,
8
- "is_world_process_zero": true,
9
- "log_history": [
10
- {
11
- "epoch": 2.78,
12
- "learning_rate": 0.00019800000000000002,
13
- "loss": 4.5903,
14
- "step": 100
15
- },
16
- {
17
- "epoch": 5.56,
18
- "learning_rate": 0.000398,
19
- "loss": 2.9083,
20
- "step": 200
21
- },
22
- {
23
- "epoch": 8.33,
24
- "learning_rate": 0.000598,
25
- "loss": 1.2823,
26
- "step": 300
27
- },
28
- {
29
- "epoch": 11.11,
30
- "learning_rate": 0.0007980000000000001,
31
- "loss": 0.3962,
32
- "step": 400
33
- },
34
- {
35
- "epoch": 13.89,
36
- "learning_rate": 0.000998,
37
- "loss": 0.3034,
38
- "step": 500
39
- },
40
- {
41
- "epoch": 13.89,
42
- "eval_loss": 0.38567885756492615,
43
- "eval_runtime": 133.1769,
44
- "eval_samples_per_second": 19.59,
45
- "eval_steps_per_second": 0.248,
46
- "eval_wer": 0.4354438434616608,
47
- "step": 500
48
- },
49
- {
50
- "epoch": 16.67,
51
- "learning_rate": 0.0009999210371864342,
52
- "loss": 0.2639,
53
- "step": 600
54
- },
55
- {
56
- "epoch": 19.44,
57
- "learning_rate": 0.0009996809758056298,
58
- "loss": 0.2354,
59
- "step": 700
60
- },
61
- {
62
- "epoch": 22.22,
63
- "learning_rate": 0.000999279885163942,
64
- "loss": 0.2158,
65
- "step": 800
66
- },
67
- {
68
- "epoch": 25.0,
69
- "learning_rate": 0.000998717894518502,
70
- "loss": 0.2063,
71
- "step": 900
72
- },
73
- {
74
- "epoch": 27.78,
75
- "learning_rate": 0.000997995184978743,
76
- "loss": 0.1926,
77
- "step": 1000
78
- },
79
- {
80
- "epoch": 27.78,
81
- "eval_loss": 0.4142022132873535,
82
- "eval_runtime": 135.7258,
83
- "eval_samples_per_second": 19.223,
84
- "eval_steps_per_second": 0.243,
85
- "eval_wer": 0.4174355711104041,
86
- "step": 1000
87
- },
88
- {
89
- "epoch": 30.56,
90
- "learning_rate": 0.0009971119894480345,
91
- "loss": 0.1771,
92
- "step": 1100
93
- },
94
- {
95
- "epoch": 33.33,
96
- "learning_rate": 0.0009960685925486266,
97
- "loss": 0.1709,
98
- "step": 1200
99
- },
100
- {
101
- "epoch": 36.11,
102
- "learning_rate": 0.0009948653305299256,
103
- "loss": 0.1724,
104
- "step": 1300
105
- },
106
- {
107
- "epoch": 38.89,
108
- "learning_rate": 0.0009935025911601335,
109
- "loss": 0.1632,
110
- "step": 1400
111
- },
112
- {
113
- "epoch": 41.67,
114
- "learning_rate": 0.0009919808136012837,
115
- "loss": 0.1609,
116
- "step": 1500
117
- },
118
- {
119
- "epoch": 41.67,
120
- "eval_loss": 0.4701250195503235,
121
- "eval_runtime": 133.1213,
122
- "eval_samples_per_second": 19.599,
123
- "eval_steps_per_second": 0.248,
124
- "eval_wer": 0.42958956411072224,
125
- "step": 1500
126
- },
127
- {
128
- "epoch": 44.44,
129
- "learning_rate": 0.0009903004882677155,
130
- "loss": 0.1521,
131
- "step": 1600
132
- },
133
- {
134
- "epoch": 47.22,
135
- "learning_rate": 0.0009884621566680308,
136
- "loss": 0.1531,
137
- "step": 1700
138
- },
139
- {
140
- "epoch": 50.0,
141
- "learning_rate": 0.0009864664112305846,
142
- "loss": 0.1514,
143
- "step": 1800
144
- },
145
- {
146
- "epoch": 52.78,
147
- "learning_rate": 0.0009843138951125682,
148
- "loss": 0.1468,
149
- "step": 1900
150
- },
151
- {
152
- "epoch": 55.56,
153
- "learning_rate": 0.000982005301992741,
154
- "loss": 0.1501,
155
- "step": 2000
156
- },
157
- {
158
- "epoch": 55.56,
159
- "eval_loss": 0.45478546619415283,
160
- "eval_runtime": 133.376,
161
- "eval_samples_per_second": 19.561,
162
- "eval_steps_per_second": 0.247,
163
- "eval_wer": 0.43805281578110083,
164
- "step": 2000
165
- },
166
- {
167
- "epoch": 58.33,
168
- "learning_rate": 0.0009795413758478834,
169
- "loss": 0.1427,
170
- "step": 2100
171
- },
172
- {
173
- "epoch": 61.11,
174
- "learning_rate": 0.0009769229107130409,
175
- "loss": 0.1441,
176
- "step": 2200
177
- },
178
- {
179
- "epoch": 63.89,
180
- "learning_rate": 0.0009741507504256327,
181
- "loss": 0.1399,
182
- "step": 2300
183
- },
184
- {
185
- "epoch": 66.67,
186
- "learning_rate": 0.0009712257883535152,
187
- "loss": 0.1379,
188
- "step": 2400
189
- },
190
- {
191
- "epoch": 69.44,
192
- "learning_rate": 0.0009681489671070803,
193
- "loss": 0.1382,
194
- "step": 2500
195
- },
196
- {
197
- "epoch": 69.44,
198
- "eval_loss": 0.523300290107727,
199
- "eval_runtime": 131.9566,
200
- "eval_samples_per_second": 19.772,
201
- "eval_steps_per_second": 0.25,
202
- "eval_wer": 0.4544066178810054,
203
- "step": 2500
204
- },
205
- {
206
- "epoch": 72.22,
207
- "learning_rate": 0.0009649212782354872,
208
- "loss": 0.1372,
209
- "step": 2600
210
- },
211
- {
212
- "epoch": 75.0,
213
- "learning_rate": 0.0009615437619071199,
214
- "loss": 0.1345,
215
- "step": 2700
216
- },
217
- {
218
- "epoch": 77.78,
219
- "learning_rate": 0.0009580175065743799,
220
- "loss": 0.1346,
221
- "step": 2800
222
- },
223
- {
224
- "epoch": 80.56,
225
- "learning_rate": 0.0009543436486229162,
226
- "loss": 0.1367,
227
- "step": 2900
228
- },
229
- {
230
- "epoch": 83.33,
231
- "learning_rate": 0.0009505233720054086,
232
- "loss": 0.1287,
233
- "step": 3000
234
- },
235
- {
236
- "epoch": 83.33,
237
- "eval_loss": 0.48360341787338257,
238
- "eval_runtime": 132.2498,
239
- "eval_samples_per_second": 19.728,
240
- "eval_steps_per_second": 0.25,
241
- "eval_wer": 0.43658924594336623,
242
- "step": 3000
243
- },
244
- {
245
- "epoch": 86.11,
246
- "learning_rate": 0.0009465579078600233,
247
- "loss": 0.1226,
248
- "step": 3100
249
- },
250
- {
251
- "epoch": 88.89,
252
- "learning_rate": 0.0009424485341136599,
253
- "loss": 0.1258,
254
- "step": 3200
255
- },
256
- {
257
- "epoch": 91.67,
258
- "learning_rate": 0.0009381965750701229,
259
- "loss": 0.1222,
260
- "step": 3300
261
- },
262
- {
263
- "epoch": 94.44,
264
- "learning_rate": 0.0009338034009833446,
265
- "loss": 0.1182,
266
- "step": 3400
267
- },
268
- {
269
- "epoch": 97.22,
270
- "learning_rate": 0.0009292704276158022,
271
- "loss": 0.1164,
272
- "step": 3500
273
- },
274
- {
275
- "epoch": 97.22,
276
- "eval_loss": 0.5202445983886719,
277
- "eval_runtime": 132.7793,
278
- "eval_samples_per_second": 19.649,
279
- "eval_steps_per_second": 0.249,
280
- "eval_wer": 0.43948456888323256,
281
- "step": 3500
282
- },
283
- {
284
- "epoch": 100.0,
285
- "learning_rate": 0.0009245991157822682,
286
- "loss": 0.1212,
287
- "step": 3600
288
- },
289
- {
290
- "epoch": 102.78,
291
- "learning_rate": 0.000919790970879042,
292
- "loss": 0.1139,
293
- "step": 3700
294
- },
295
- {
296
- "epoch": 105.56,
297
- "learning_rate": 0.000914847542398815,
298
- "loss": 0.115,
299
- "step": 3800
300
- },
301
- {
302
- "epoch": 108.33,
303
- "learning_rate": 0.0009097704234313245,
304
- "loss": 0.1123,
305
- "step": 3900
306
- },
307
- {
308
- "epoch": 111.11,
309
- "learning_rate": 0.0009045612501499573,
310
- "loss": 0.1101,
311
- "step": 4000
312
- },
313
- {
314
- "epoch": 111.11,
315
- "eval_loss": 0.5120447874069214,
316
- "eval_runtime": 131.3001,
317
- "eval_samples_per_second": 19.871,
318
- "eval_steps_per_second": 0.251,
319
- "eval_wer": 0.43827553293032134,
320
- "step": 4000
321
- },
322
- {
323
- "epoch": 113.89,
324
- "learning_rate": 0.0008992217012844713,
325
- "loss": 0.1092,
326
- "step": 4100
327
- },
328
- {
329
- "epoch": 116.67,
330
- "learning_rate": 0.0008937534975799996,
331
- "loss": 0.1104,
332
- "step": 4200
333
- },
334
- {
335
- "epoch": 119.44,
336
- "learning_rate": 0.0008881584012425165,
337
- "loss": 0.1021,
338
- "step": 4300
339
- },
340
- {
341
- "epoch": 122.22,
342
- "learning_rate": 0.0008824382153709421,
343
- "loss": 0.1063,
344
- "step": 4400
345
- },
346
- {
347
- "epoch": 125.0,
348
- "learning_rate": 0.0008765947833760678,
349
- "loss": 0.1107,
350
- "step": 4500
351
- },
352
- {
353
- "epoch": 125.0,
354
- "eval_loss": 0.5130612850189209,
355
- "eval_runtime": 133.0961,
356
- "eval_samples_per_second": 19.602,
357
- "eval_steps_per_second": 0.248,
358
- "eval_wer": 0.4446706967865097,
359
- "step": 4500
360
- },
361
- {
362
- "epoch": 127.78,
363
- "learning_rate": 0.000870629988386491,
364
- "loss": 0.1054,
365
- "step": 4600
366
- },
367
- {
368
- "epoch": 130.56,
369
- "learning_rate": 0.0008645457526417502,
370
- "loss": 0.1037,
371
- "step": 4700
372
- },
373
- {
374
- "epoch": 133.33,
375
- "learning_rate": 0.0008583440368728572,
376
- "loss": 0.1,
377
- "step": 4800
378
- },
379
- {
380
- "epoch": 136.11,
381
- "learning_rate": 0.0008520268396704223,
382
- "loss": 0.0967,
383
- "step": 4900
384
- },
385
- {
386
- "epoch": 138.89,
387
- "learning_rate": 0.0008455961968405809,
388
- "loss": 0.0942,
389
- "step": 5000
390
- },
391
- {
392
- "epoch": 138.89,
393
- "eval_loss": 0.5256752967834473,
394
- "eval_runtime": 133.1352,
395
- "eval_samples_per_second": 19.597,
396
- "eval_steps_per_second": 0.248,
397
- "eval_wer": 0.43748011454024816,
398
- "step": 5000
399
- },
400
- {
401
- "epoch": 141.67,
402
- "learning_rate": 0.0008390541807489265,
403
- "loss": 0.0987,
404
- "step": 5100
405
- },
406
- {
407
- "epoch": 144.44,
408
- "learning_rate": 0.0008324028996526611,
409
- "loss": 0.094,
410
- "step": 5200
411
- },
412
- {
413
- "epoch": 147.22,
414
- "learning_rate": 0.0008256444970211793,
415
- "loss": 0.0935,
416
- "step": 5300
417
- },
418
- {
419
- "epoch": 150.0,
420
- "learning_rate": 0.000818781150845306,
421
- "loss": 0.0906,
422
- "step": 5400
423
- },
424
- {
425
- "epoch": 152.78,
426
- "learning_rate": 0.0008118150729354068,
427
- "loss": 0.0909,
428
- "step": 5500
429
- },
430
- {
431
- "epoch": 152.78,
432
- "eval_loss": 0.5312919020652771,
433
- "eval_runtime": 133.5185,
434
- "eval_samples_per_second": 19.54,
435
- "eval_steps_per_second": 0.247,
436
- "eval_wer": 0.47133312122176263,
437
- "step": 5500
438
- },
439
- {
440
- "epoch": 155.56,
441
- "learning_rate": 0.0008047485082086017,
442
- "loss": 0.0881,
443
- "step": 5600
444
- },
445
- {
446
- "epoch": 158.33,
447
- "learning_rate": 0.0007975837339653084,
448
- "loss": 0.0921,
449
- "step": 5700
450
- },
451
- {
452
- "epoch": 161.11,
453
- "learning_rate": 0.0007903230591553503,
454
- "loss": 0.0838,
455
- "step": 5800
456
- },
457
- {
458
- "epoch": 163.89,
459
- "learning_rate": 0.0007829688236338643,
460
- "loss": 0.0775,
461
- "step": 5900
462
- },
463
- {
464
- "epoch": 166.67,
465
- "learning_rate": 0.0007755233974072504,
466
- "loss": 0.0807,
467
- "step": 6000
468
- },
469
- {
470
- "epoch": 166.67,
471
- "eval_loss": 0.5847254991531372,
472
- "eval_runtime": 133.1812,
473
- "eval_samples_per_second": 19.59,
474
- "eval_steps_per_second": 0.248,
475
- "eval_wer": 0.44708876869233216,
476
- "step": 6000
477
- },
478
- {
479
- "epoch": 169.44,
480
- "learning_rate": 0.0007679891798694021,
481
- "loss": 0.0801,
482
- "step": 6100
483
- },
484
- {
485
- "epoch": 172.22,
486
- "learning_rate": 0.000760368599028469,
487
- "loss": 0.0952,
488
- "step": 6200
489
- },
490
- {
491
- "epoch": 175.0,
492
- "learning_rate": 0.0007526641107243966,
493
- "loss": 0.0813,
494
- "step": 6300
495
- },
496
- {
497
- "epoch": 177.78,
498
- "learning_rate": 0.0007448781978374969,
499
- "loss": 0.0795,
500
- "step": 6400
501
- },
502
- {
503
- "epoch": 180.56,
504
- "learning_rate": 0.0007370133694883051,
505
- "loss": 0.0767,
506
- "step": 6500
507
- },
508
- {
509
- "epoch": 180.56,
510
- "eval_loss": 0.5318175554275513,
511
- "eval_runtime": 135.804,
512
- "eval_samples_per_second": 19.212,
513
- "eval_steps_per_second": 0.243,
514
- "eval_wer": 0.4534521158129176,
515
- "step": 6500
516
- },
517
- {
518
- "epoch": 183.33,
519
- "learning_rate": 0.0007290721602289801,
520
- "loss": 0.0762,
521
- "step": 6600
522
- },
523
- {
524
- "epoch": 186.11,
525
- "learning_rate": 0.0007210571292265096,
526
- "loss": 0.0729,
527
- "step": 6700
528
- },
529
- {
530
- "epoch": 188.89,
531
- "learning_rate": 0.0007129708594379816,
532
- "loss": 0.0751,
533
- "step": 6800
534
- },
535
- {
536
- "epoch": 191.67,
537
- "learning_rate": 0.0007048159567781905,
538
- "loss": 0.0743,
539
- "step": 6900
540
- },
541
- {
542
- "epoch": 194.44,
543
- "learning_rate": 0.0006965950492798443,
544
- "loss": 0.0729,
545
- "step": 7000
546
- },
547
- {
548
- "epoch": 194.44,
549
- "eval_loss": 0.5796982645988464,
550
- "eval_runtime": 132.2018,
551
- "eval_samples_per_second": 19.735,
552
- "eval_steps_per_second": 0.25,
553
- "eval_wer": 0.4584155265669742,
554
- "step": 7000
555
- },
556
- {
557
- "epoch": 197.22,
558
- "learning_rate": 0.0006883107862466433,
559
- "loss": 0.0791,
560
- "step": 7100
561
- },
562
- {
563
- "epoch": 200.0,
564
- "learning_rate": 0.0006799658373995054,
565
- "loss": 0.0737,
566
- "step": 7200
567
- },
568
- {
569
- "epoch": 202.78,
570
- "learning_rate": 0.0006715628920162093,
571
- "loss": 0.0694,
572
- "step": 7300
573
- },
574
- {
575
- "epoch": 205.56,
576
- "learning_rate": 0.0006631046580647384,
577
- "loss": 0.0687,
578
- "step": 7400
579
- },
580
- {
581
- "epoch": 208.33,
582
- "learning_rate": 0.0006545938613305993,
583
- "loss": 0.072,
584
- "step": 7500
585
- },
586
- {
587
- "epoch": 208.33,
588
- "eval_loss": 0.5266388654708862,
589
- "eval_runtime": 130.3709,
590
- "eval_samples_per_second": 20.012,
591
- "eval_steps_per_second": 0.253,
592
- "eval_wer": 0.44339802736239264,
593
- "step": 7500
594
- },
595
- {
596
- "epoch": 211.11,
597
- "learning_rate": 0.000646033244538398,
598
- "loss": 0.0647,
599
- "step": 7600
600
- },
601
- {
602
- "epoch": 213.89,
603
- "learning_rate": 0.000637425566467959,
604
- "loss": 0.0631,
605
- "step": 7700
606
- },
607
- {
608
- "epoch": 216.67,
609
- "learning_rate": 0.0006287736010652693,
610
- "loss": 0.0606,
611
- "step": 7800
612
- },
613
- {
614
- "epoch": 219.44,
615
- "learning_rate": 0.000620080136548535,
616
- "loss": 0.0645,
617
- "step": 7900
618
- },
619
- {
620
- "epoch": 222.22,
621
- "learning_rate": 0.0006113479745096386,
622
- "loss": 0.0593,
623
- "step": 8000
624
- },
625
- {
626
- "epoch": 222.22,
627
- "eval_loss": 0.579177737236023,
628
- "eval_runtime": 133.0716,
629
- "eval_samples_per_second": 19.606,
630
- "eval_steps_per_second": 0.248,
631
- "eval_wer": 0.43888005090677695,
632
- "step": 8000
633
- },
634
- {
635
- "epoch": 225.0,
636
- "learning_rate": 0.0006025799290112865,
637
- "loss": 0.0596,
638
- "step": 8100
639
- },
640
- {
641
- "epoch": 227.78,
642
- "learning_rate": 0.0005937788256801371,
643
- "loss": 0.0606,
644
- "step": 8200
645
- },
646
- {
647
- "epoch": 230.56,
648
- "learning_rate": 0.0005849475007962031,
649
- "loss": 0.0591,
650
- "step": 8300
651
- },
652
- {
653
- "epoch": 233.33,
654
- "learning_rate": 0.0005760888003788196,
655
- "loss": 0.0544,
656
- "step": 8400
657
- },
658
- {
659
- "epoch": 236.11,
660
- "learning_rate": 0.0005672055792694753,
661
- "loss": 0.0524,
662
- "step": 8500
663
- },
664
- {
665
- "epoch": 236.11,
666
- "eval_loss": 0.5740395784378052,
667
- "eval_runtime": 132.5642,
668
- "eval_samples_per_second": 19.681,
669
- "eval_steps_per_second": 0.249,
670
- "eval_wer": 0.43732103086223356,
671
- "step": 8500
672
- },
673
- {
674
- "epoch": 238.89,
675
- "learning_rate": 0.0005583007002117978,
676
- "loss": 0.0504,
677
- "step": 8600
678
- },
679
- {
680
- "epoch": 241.67,
681
- "learning_rate": 0.0005493770329289953,
682
- "loss": 0.0494,
683
- "step": 8700
684
- },
685
- {
686
- "epoch": 244.44,
687
- "learning_rate": 0.0005404374531990474,
688
- "loss": 0.0484,
689
- "step": 8800
690
- },
691
- {
692
- "epoch": 247.22,
693
- "learning_rate": 0.0005314848419279442,
694
- "loss": 0.0489,
695
- "step": 8900
696
- },
697
- {
698
- "epoch": 250.0,
699
- "learning_rate": 0.0005225220842212748,
700
- "loss": 0.0494,
701
- "step": 9000
702
- },
703
- {
704
- "epoch": 250.0,
705
- "eval_loss": 0.5520852208137512,
706
- "eval_runtime": 133.6258,
707
- "eval_samples_per_second": 19.525,
708
- "eval_steps_per_second": 0.247,
709
- "eval_wer": 0.44358892777601017,
710
- "step": 9000
711
- },
712
- {
713
- "epoch": 252.78,
714
- "learning_rate": 0.0005135520684544602,
715
- "loss": 0.0499,
716
- "step": 9100
717
- },
718
- {
719
- "epoch": 255.56,
720
- "learning_rate": 0.0005045776853419344,
721
- "loss": 0.0487,
722
- "step": 9200
723
- },
724
- {
725
- "epoch": 258.33,
726
- "learning_rate": 0.0004956018270055703,
727
- "loss": 0.0523,
728
- "step": 9300
729
- },
730
- {
731
- "epoch": 261.11,
732
- "learning_rate": 0.00048662738604265206,
733
- "loss": 0.0479,
734
- "step": 9400
735
- },
736
- {
737
- "epoch": 263.89,
738
- "learning_rate": 0.0004776572545936954,
739
- "loss": 0.0469,
740
- "step": 9500
741
- },
742
- {
743
- "epoch": 263.89,
744
- "eval_loss": 0.5630596876144409,
745
- "eval_runtime": 130.7272,
746
- "eval_samples_per_second": 19.958,
747
- "eval_steps_per_second": 0.252,
748
- "eval_wer": 0.4345847916003818,
749
- "step": 9500
750
- },
751
- {
752
- "epoch": 266.67,
753
- "learning_rate": 0.0004686943234104146,
754
- "loss": 0.0467,
755
- "step": 9600
756
- },
757
- {
758
- "epoch": 269.44,
759
- "learning_rate": 0.00045974148092413597,
760
- "loss": 0.0438,
761
- "step": 9700
762
- },
763
- {
764
- "epoch": 272.22,
765
- "learning_rate": 0.00045080161231496064,
766
- "loss": 0.0422,
767
- "step": 9800
768
- },
769
- {
770
- "epoch": 275.0,
771
- "learning_rate": 0.00044187759858197486,
772
- "loss": 0.042,
773
- "step": 9900
774
- },
775
- {
776
- "epoch": 277.78,
777
- "learning_rate": 0.0004329723156148063,
778
- "loss": 0.0417,
779
- "step": 10000
780
- },
781
- {
782
- "epoch": 277.78,
783
- "eval_loss": 0.5777372121810913,
784
- "eval_runtime": 130.7332,
785
- "eval_samples_per_second": 19.957,
786
- "eval_steps_per_second": 0.252,
787
- "eval_wer": 0.43057588291441296,
788
- "step": 10000
789
- },
790
- {
791
- "epoch": 280.56,
792
- "learning_rate": 0.0004240886332668285,
793
- "loss": 0.0406,
794
- "step": 10100
795
- },
796
- {
797
- "epoch": 283.33,
798
- "learning_rate": 0.00041522941443031025,
799
- "loss": 0.0385,
800
- "step": 10200
801
- },
802
- {
803
- "epoch": 286.11,
804
- "learning_rate": 0.0004063975141138074,
805
- "loss": 0.0384,
806
- "step": 10300
807
- },
808
- {
809
- "epoch": 288.89,
810
- "learning_rate": 0.00039759577852209704,
811
- "loss": 0.0369,
812
- "step": 10400
813
- },
814
- {
815
- "epoch": 291.67,
816
- "learning_rate": 0.0003888270441389465,
817
- "loss": 0.0379,
818
- "step": 10500
819
- },
820
- {
821
- "epoch": 291.67,
822
- "eval_loss": 0.5934527516365051,
823
- "eval_runtime": 131.6738,
824
- "eval_samples_per_second": 19.814,
825
- "eval_steps_per_second": 0.251,
826
- "eval_wer": 0.42828507795100224,
827
- "step": 10500
828
- },
829
- {
830
- "epoch": 294.44,
831
- "learning_rate": 0.0003800941368130171,
832
- "loss": 0.0399,
833
- "step": 10600
834
- },
835
- {
836
- "epoch": 297.22,
837
- "learning_rate": 0.0003713998708471946,
838
- "loss": 0.0359,
839
- "step": 10700
840
- },
841
- {
842
- "epoch": 300.0,
843
- "learning_rate": 0.0003627470480916394,
844
- "loss": 0.0345,
845
- "step": 10800
846
- },
847
- {
848
- "epoch": 302.78,
849
- "learning_rate": 0.00035413845704085215,
850
- "loss": 0.0346,
851
- "step": 10900
852
- },
853
- {
854
- "epoch": 305.56,
855
- "learning_rate": 0.00034557687193504045,
856
- "loss": 0.0319,
857
- "step": 11000
858
- },
859
- {
860
- "epoch": 305.56,
861
- "eval_loss": 0.5892442464828491,
862
- "eval_runtime": 130.692,
863
- "eval_samples_per_second": 19.963,
864
- "eval_steps_per_second": 0.253,
865
- "eval_wer": 0.41880369074132995,
866
- "step": 11000
867
- },
868
- {
869
- "epoch": 308.33,
870
- "learning_rate": 0.00033706505186608136,
871
- "loss": 0.0318,
872
- "step": 11100
873
- },
874
- {
875
- "epoch": 311.11,
876
- "learning_rate": 0.00032860573988836573,
877
- "loss": 0.0301,
878
- "step": 11200
879
- },
880
- {
881
- "epoch": 313.89,
882
- "learning_rate": 0.0003202016621348088,
883
- "loss": 0.0322,
884
- "step": 11300
885
- },
886
- {
887
- "epoch": 316.67,
888
- "learning_rate": 0.00031185552693831594,
889
- "loss": 0.0331,
890
- "step": 11400
891
- },
892
- {
893
- "epoch": 319.44,
894
- "learning_rate": 0.0003035700239589846,
895
- "loss": 0.0311,
896
- "step": 11500
897
- },
898
- {
899
- "epoch": 319.44,
900
- "eval_loss": 0.6010639071464539,
901
- "eval_runtime": 132.2371,
902
- "eval_samples_per_second": 19.73,
903
- "eval_steps_per_second": 0.25,
904
- "eval_wer": 0.4210626789691378,
905
- "step": 11500
906
- },
907
- {
908
- "epoch": 322.22,
909
- "learning_rate": 0.00029534782331732204,
910
- "loss": 0.0291,
911
- "step": 11600
912
- },
913
- {
914
- "epoch": 325.0,
915
- "learning_rate": 0.00028719157473376303,
916
- "loss": 0.0287,
917
- "step": 11700
918
- },
919
- {
920
- "epoch": 327.78,
921
- "learning_rate": 0.00027918443530500935,
922
- "loss": 0.0279,
923
- "step": 11800
924
- },
925
- {
926
- "epoch": 330.56,
927
- "learning_rate": 0.0002711672294401907,
928
- "loss": 0.0294,
929
- "step": 11900
930
- },
931
- {
932
- "epoch": 333.33,
933
- "learning_rate": 0.00026322376817181157,
934
- "loss": 0.0269,
935
- "step": 12000
936
- },
937
- {
938
- "epoch": 333.33,
939
- "eval_loss": 0.5972930192947388,
940
- "eval_runtime": 133.0245,
941
- "eval_samples_per_second": 19.613,
942
- "eval_steps_per_second": 0.248,
943
- "eval_wer": 0.4232262169901368,
944
- "step": 12000
945
- },
946
- {
947
- "epoch": 336.11,
948
- "learning_rate": 0.0002553566113926006,
949
- "loss": 0.0251,
950
- "step": 12100
951
- },
952
- {
953
- "epoch": 338.89,
954
- "learning_rate": 0.00024756829440508705,
955
- "loss": 0.0261,
956
- "step": 12200
957
- },
958
- {
959
- "epoch": 341.67,
960
- "learning_rate": 0.0002398613271045611,
961
- "loss": 0.025,
962
- "step": 12300
963
- },
964
- {
965
- "epoch": 344.44,
966
- "learning_rate": 0.00023223819317022654,
967
- "loss": 0.0264,
968
- "step": 12400
969
- },
970
- {
971
- "epoch": 347.22,
972
- "learning_rate": 0.00022470134926479935,
973
- "loss": 0.0271,
974
- "step": 12500
975
- },
976
- {
977
- "epoch": 347.22,
978
- "eval_loss": 0.6094068288803101,
979
- "eval_runtime": 132.9769,
980
- "eval_samples_per_second": 19.62,
981
- "eval_steps_per_second": 0.248,
982
- "eval_wer": 0.4428253261215399,
983
- "step": 12500
984
- },
985
- {
986
- "epoch": 350.0,
987
- "learning_rate": 0.00021725322424281286,
988
- "loss": 0.0246,
989
- "step": 12600
990
- },
991
- {
992
- "epoch": 352.78,
993
- "learning_rate": 0.00020989621836788614,
994
- "loss": 0.0245,
995
- "step": 12700
996
- },
997
- {
998
- "epoch": 355.56,
999
- "learning_rate": 0.00020263270253920428,
1000
- "loss": 0.0229,
1001
- "step": 12800
1002
- },
1003
- {
1004
- "epoch": 358.33,
1005
- "learning_rate": 0.00019546501752746288,
1006
- "loss": 0.0229,
1007
- "step": 12900
1008
- },
1009
- {
1010
- "epoch": 361.11,
1011
- "learning_rate": 0.0001883954732205217,
1012
- "loss": 0.0236,
1013
- "step": 13000
1014
- },
1015
- {
1016
- "epoch": 361.11,
1017
- "eval_loss": 0.611167311668396,
1018
- "eval_runtime": 132.3797,
1019
- "eval_samples_per_second": 19.708,
1020
- "eval_steps_per_second": 0.249,
1021
- "eval_wer": 0.42373528475978367,
1022
- "step": 13000
1023
- },
1024
- {
1025
- "epoch": 363.89,
1026
- "learning_rate": 0.00018142634787900996,
1027
- "loss": 0.0229,
1028
- "step": 13100
1029
- },
1030
- {
1031
- "epoch": 366.67,
1032
- "learning_rate": 0.00017455988740212576,
1033
- "loss": 0.0221,
1034
- "step": 13200
1035
- },
1036
- {
1037
- "epoch": 369.44,
1038
- "learning_rate": 0.0001677983046038624,
1039
- "loss": 0.0208,
1040
- "step": 13300
1041
- },
1042
- {
1043
- "epoch": 372.22,
1044
- "learning_rate": 0.00016114377849989813,
1045
- "loss": 0.0208,
1046
- "step": 13400
1047
- },
1048
- {
1049
- "epoch": 375.0,
1050
- "learning_rate": 0.00015459845360537756,
1051
- "loss": 0.0202,
1052
- "step": 13500
1053
- },
1054
- {
1055
- "epoch": 375.0,
1056
- "eval_loss": 0.605171799659729,
1057
- "eval_runtime": 132.1498,
1058
- "eval_samples_per_second": 19.743,
1059
- "eval_steps_per_second": 0.25,
1060
- "eval_wer": 0.4233534839325485,
1061
- "step": 13500
1062
- },
1063
- {
1064
- "epoch": 377.78,
1065
- "learning_rate": 0.0001481644392438113,
1066
- "loss": 0.0197,
1067
- "step": 13600
1068
- },
1069
- {
1070
- "epoch": 380.56,
1071
- "learning_rate": 0.00014184380886731607,
1072
- "loss": 0.0195,
1073
- "step": 13700
1074
- },
1075
- {
1076
- "epoch": 383.33,
1077
- "learning_rate": 0.0001356385993884165,
1078
- "loss": 0.0186,
1079
- "step": 13800
1080
- },
1081
- {
1082
- "epoch": 386.11,
1083
- "learning_rate": 0.00012955081052362072,
1084
- "loss": 0.0186,
1085
- "step": 13900
1086
- },
1087
- {
1088
- "epoch": 388.89,
1089
- "learning_rate": 0.00012358240414898276,
1090
- "loss": 0.0175,
1091
- "step": 14000
1092
- },
1093
- {
1094
- "epoch": 388.89,
1095
- "eval_loss": 0.631072998046875,
1096
- "eval_runtime": 131.5592,
1097
- "eval_samples_per_second": 19.831,
1098
- "eval_steps_per_second": 0.251,
1099
- "eval_wer": 0.4188673242125358,
1100
- "step": 14000
1101
- },
1102
- {
1103
- "epoch": 391.67,
1104
- "learning_rate": 0.00011773530366786184,
1105
- "loss": 0.0164,
1106
- "step": 14100
1107
- },
1108
- {
1109
- "epoch": 394.44,
1110
- "learning_rate": 0.0001120113933910767,
1111
- "loss": 0.0166,
1112
- "step": 14200
1113
- },
1114
- {
1115
- "epoch": 397.22,
1116
- "learning_rate": 0.000106412517929661,
1117
- "loss": 0.0163,
1118
- "step": 14300
1119
- },
1120
- {
1121
- "epoch": 400.0,
1122
- "learning_rate": 0.00010094048160041091,
1123
- "loss": 0.0159,
1124
- "step": 14400
1125
- },
1126
- {
1127
- "epoch": 402.78,
1128
- "learning_rate": 9.559704784441814e-05,
1129
- "loss": 0.0158,
1130
- "step": 14500
1131
- },
1132
- {
1133
- "epoch": 402.78,
1134
- "eval_loss": 0.618556797504425,
1135
- "eval_runtime": 132.4333,
1136
- "eval_samples_per_second": 19.7,
1137
- "eval_steps_per_second": 0.249,
1138
- "eval_wer": 0.4137130130448616,
1139
- "step": 14500
1140
- },
1141
- {
1142
- "epoch": 405.56,
1143
- "learning_rate": 9.038393865877726e-05,
1144
- "loss": 0.015,
1145
- "step": 14600
1146
- },
1147
- {
1148
- "epoch": 408.33,
1149
- "learning_rate": 8.530283404164612e-05,
1150
- "loss": 0.0156,
1151
- "step": 14700
1152
- },
1153
- {
1154
- "epoch": 411.11,
1155
- "learning_rate": 8.03553714508441e-05,
1156
- "loss": 0.0146,
1157
- "step": 14800
1158
- },
1159
- {
1160
- "epoch": 413.89,
1161
- "learning_rate": 7.554314527615763e-05,
1162
- "loss": 0.0146,
1163
- "step": 14900
1164
- },
1165
- {
1166
- "epoch": 416.67,
1167
- "learning_rate": 7.086770632552514e-05,
1168
- "loss": 0.0141,
1169
- "step": 15000
1170
- },
1171
- {
1172
- "epoch": 416.67,
1173
- "eval_loss": 0.6352781057357788,
1174
- "eval_runtime": 132.6132,
1175
- "eval_samples_per_second": 19.674,
1176
- "eval_steps_per_second": 0.249,
1177
- "eval_wer": 0.412249443207127,
1178
- "step": 15000
1179
- },
1180
- {
1181
- "epoch": 419.44,
1182
- "learning_rate": 6.633056132526849e-05,
1183
- "loss": 0.0138,
1184
- "step": 15100
1185
- },
1186
- {
1187
- "epoch": 422.22,
1188
- "learning_rate": 6.193317243452734e-05,
1189
- "loss": 0.0138,
1190
- "step": 15200
1191
- },
1192
- {
1193
- "epoch": 425.0,
1194
- "learning_rate": 5.7676956774059205e-05,
1195
- "loss": 0.0131,
1196
- "step": 15300
1197
- },
1198
- {
1199
- "epoch": 427.78,
1200
- "learning_rate": 5.356328596955179e-05,
1201
- "loss": 0.0131,
1202
- "step": 15400
1203
- },
1204
- {
1205
- "epoch": 430.56,
1206
- "learning_rate": 4.963246731369253e-05,
1207
- "loss": 0.013,
1208
- "step": 15500
1209
- },
1210
- {
1211
- "epoch": 430.56,
1212
- "eval_loss": 0.6343812942504883,
1213
- "eval_runtime": 131.5808,
1214
- "eval_samples_per_second": 19.828,
1215
- "eval_steps_per_second": 0.251,
1216
- "eval_wer": 0.40687241489023224,
1217
- "step": 15500
1218
- },
1219
- {
1220
- "epoch": 433.33,
1221
- "learning_rate": 4.580635924447718e-05,
1222
- "loss": 0.0127,
1223
- "step": 15600
1224
- },
1225
- {
1226
- "epoch": 436.11,
1227
- "learning_rate": 4.212662149914887e-05,
1228
- "loss": 0.0126,
1229
- "step": 15700
1230
- },
1231
- {
1232
- "epoch": 438.89,
1233
- "learning_rate": 3.859443992523443e-05,
1234
- "loss": 0.0125,
1235
- "step": 15800
1236
- },
1237
- {
1238
- "epoch": 441.67,
1239
- "learning_rate": 3.521095281819786e-05,
1240
- "loss": 0.0127,
1241
- "step": 15900
1242
- },
1243
- {
1244
- "epoch": 444.44,
1245
- "learning_rate": 3.1977250554608205e-05,
1246
- "loss": 0.0117,
1247
- "step": 16000
1248
- },
1249
- {
1250
- "epoch": 444.44,
1251
- "eval_loss": 0.6442536115646362,
1252
- "eval_runtime": 132.782,
1253
- "eval_samples_per_second": 19.649,
1254
- "eval_steps_per_second": 0.249,
1255
- "eval_wer": 0.40801781737193765,
1256
- "step": 16000
1257
- },
1258
- {
1259
- "epoch": 447.22,
1260
- "learning_rate": 2.8894375240750613e-05,
1261
- "loss": 0.0122,
1262
- "step": 16100
1263
- },
1264
- {
1265
- "epoch": 450.0,
1266
- "learning_rate": 2.5963320376792666e-05,
1267
- "loss": 0.0127,
1268
- "step": 16200
1269
- },
1270
- {
1271
- "epoch": 452.78,
1272
- "learning_rate": 2.318503053661475e-05,
1273
- "loss": 0.0125,
1274
- "step": 16300
1275
- },
1276
- {
1277
- "epoch": 455.56,
1278
- "learning_rate": 2.056040106340823e-05,
1279
- "loss": 0.0121,
1280
- "step": 16400
1281
- },
1282
- {
1283
- "epoch": 458.33,
1284
- "learning_rate": 1.809027778113803e-05,
1285
- "loss": 0.0122,
1286
- "step": 16500
1287
- },
1288
- {
1289
- "epoch": 458.33,
1290
- "eval_loss": 0.6512282490730286,
1291
- "eval_runtime": 133.1307,
1292
- "eval_samples_per_second": 19.597,
1293
- "eval_steps_per_second": 0.248,
1294
- "eval_wer": 0.4069360483614381,
1295
- "step": 16500
1296
- },
1297
- {
1298
- "epoch": 461.11,
1299
- "learning_rate": 1.5775456721964065e-05,
1300
- "loss": 0.0113,
1301
- "step": 16600
1302
- },
1303
- {
1304
- "epoch": 463.89,
1305
- "learning_rate": 1.3616683869708658e-05,
1306
- "loss": 0.0113,
1307
- "step": 16700
1308
- },
1309
- {
1310
- "epoch": 466.67,
1311
- "learning_rate": 1.1614654919452406e-05,
1312
- "loss": 0.0117,
1313
- "step": 16800
1314
- },
1315
- {
1316
- "epoch": 469.44,
1317
- "learning_rate": 9.770015053337078e-06,
1318
- "loss": 0.0112,
1319
- "step": 16900
1320
- },
1321
- {
1322
- "epoch": 472.22,
1323
- "learning_rate": 8.083358732646206e-06,
1324
- "loss": 0.0115,
1325
- "step": 17000
1326
- },
1327
- {
1328
- "epoch": 472.22,
1329
- "eval_loss": 0.6556624174118042,
1330
- "eval_runtime": 132.4623,
1331
- "eval_samples_per_second": 19.696,
1332
- "eval_steps_per_second": 0.249,
1333
- "eval_wer": 0.4069360483614381,
1334
- "step": 17000
1335
- },
1336
- {
1337
- "epoch": 475.0,
1338
- "learning_rate": 6.555229506231608e-06,
1339
- "loss": 0.0111,
1340
- "step": 17100
1341
- },
1342
- {
1343
- "epoch": 477.78,
1344
- "learning_rate": 5.186119835347169e-06,
1345
- "loss": 0.0118,
1346
- "step": 17200
1347
- },
1348
- {
1349
- "epoch": 480.56,
1350
- "learning_rate": 3.976470934946075e-06,
1351
- "loss": 0.0112,
1352
- "step": 17300
1353
- },
1354
- {
1355
- "epoch": 483.33,
1356
- "learning_rate": 2.92667263149321e-06,
1357
- "loss": 0.0117,
1358
- "step": 17400
1359
- },
1360
- {
1361
- "epoch": 486.11,
1362
- "learning_rate": 2.037063237338044e-06,
1363
- "loss": 0.0111,
1364
- "step": 17500
1365
- },
1366
- {
1367
- "epoch": 486.11,
1368
- "eval_loss": 0.6513079404830933,
1369
- "eval_runtime": 131.4726,
1370
- "eval_samples_per_second": 19.844,
1371
- "eval_steps_per_second": 0.251,
1372
- "eval_wer": 0.4059497295577474,
1373
- "step": 17500
1374
- },
1375
- {
1376
- "epoch": 488.89,
1377
- "learning_rate": 1.3144256109794418e-06,
1378
- "loss": 0.0109,
1379
- "step": 17600
1380
- },
1381
- {
1382
- "epoch": 491.67,
1383
- "learning_rate": 7.44394288673067e-07,
1384
- "loss": 0.0112,
1385
- "step": 17700
1386
- },
1387
- {
1388
- "epoch": 494.44,
1389
- "learning_rate": 3.352551457218578e-07,
1390
- "loss": 0.0113,
1391
- "step": 17800
1392
- },
1393
- {
1394
- "epoch": 497.22,
1395
- "learning_rate": 8.714003300058781e-08,
1396
- "loss": 0.011,
1397
- "step": 17900
1398
- },
1399
- {
1400
- "epoch": 500.0,
1401
- "learning_rate": 1.2890911316176812e-10,
1402
- "loss": 0.0113,
1403
- "step": 18000
1404
- },
1405
- {
1406
- "epoch": 500.0,
1407
- "eval_loss": 0.6521313190460205,
1408
- "eval_runtime": 132.4384,
1409
- "eval_samples_per_second": 19.7,
1410
- "eval_steps_per_second": 0.249,
1411
- "eval_wer": 0.40601336302895324,
1412
- "step": 18000
1413
- },
1414
- {
1415
- "epoch": 500.0,
1416
- "step": 18000,
1417
- "total_flos": 5.3110650126518e+20,
1418
- "train_loss": 0.11533763631184896,
1419
- "train_runtime": 176050.2174,
1420
- "train_samples_per_second": 16.203,
1421
- "train_steps_per_second": 0.102
1422
- }
1423
- ],
1424
- "max_steps": 18000,
1425
- "num_train_epochs": 500,
1426
- "total_flos": 5.3110650126518e+20,
1427
- "trial_name": null,
1428
- "trial_params": null
1429
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9be3a7c88f8500cf6b3a8b0b089125768d465147886310e4abb4ddc8cf154dd1
3
  size 3055
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:020e62b69669cb5205d10821c92f57fc9ddfd0706b2f7dd41539b83bb4d40ffb
3
  size 3055
wandb/debug-internal.log CHANGED
@@ -1 +1 @@
1
- run-20220126_121554-295enqix/logs/debug-internal.log
 
1
+ run-20220129_111936-33z1cg4n/logs/debug-internal.log
wandb/debug.log CHANGED
@@ -1 +1 @@
1
- run-20220126_121554-295enqix/logs/debug.log
 
1
+ run-20220129_111936-33z1cg4n/logs/debug.log
wandb/latest-run CHANGED
@@ -1 +1 @@
1
- run-20220126_121554-295enqix
 
1
+ run-20220129_111936-33z1cg4n
wandb/run-20220126_105847-1xdiy2kf/files/config.yaml CHANGED
@@ -4829,7 +4829,13 @@ _wandb:
4829
  - 1
4830
  - 5
4831
  - 11
 
 
 
 
4832
  3:
 
 
4833
  - 13
4834
  4: 3.9.6
4835
  5: 0.12.9
 
4829
  - 1
4830
  - 5
4831
  - 11
4832
+ 2:
4833
+ - 1
4834
+ - 5
4835
+ - 11
4836
  3:
4837
+ - 1
4838
+ - 7
4839
  - 13
4840
  4: 3.9.6
4841
  5: 0.12.9
wandb/run-20220126_105847-1xdiy2kf/files/output.log CHANGED
@@ -19602,3 +19602,87 @@ Configuration saved in ./config.json.78s/it]our model on huggingface.co/models =
19602
  97% 32/33 [02:06<00:03, 3.19s/it]tion set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19603
  Configuration saved in ./config.jsonion set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19604
  Configuration saved in ./preprocessor_config.jsont have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.orward` and have been ignored: input_length.h..
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
19602
  97% 32/33 [02:06<00:03, 3.19s/it]tion set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19603
  Configuration saved in ./config.jsonion set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19604
  Configuration saved in ./preprocessor_config.jsont have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19605
+ Configuration saved in ./preprocessor_config.jsont have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19606
+ ***** eval metrics *****
19607
+ epoch = 500.0
19608
+ eval_loss = 0.6521
19609
+ eval_runtime = 0:02:14.01
19610
+ eval_samples = 2609
19611
+ eval_samples_per_second = 19.468
19612
+ eval_steps_per_second = 0.246
19613
+ eval_wer = 0.406
19614
+ 01/28/2022 11:55:40 - WARNING - huggingface_hub.repository - Several commits (2) will be pushed upstream.
19615
+ The progress bars may be unreliable.pstream..jsont have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19616
+ Upload file wandb/run-20220126_105847-1xdiy2kf/run-1xdiy2kf.wandb: 0% 32.0k/119M [00:00<?, ?B/s]C.forward` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19617
+ Upload file pytorch_model.bin: 2% 28.1M/1.18G [00:02<01:18, 15.6MB/s] 8.50M/119M [00:02<00:24, 4.82MB/s]d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19618
+ Upload file pytorch_model.bin: 5% 57.1M/1.18G [00:04<01:20, 15.0MB/s] 24.0M/119M [00:04<00:14, 6.99MB/s]d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19619
+ Upload file wandb/run-20220126_105847-1xdiy2kf/run-1xdiy2kf.wandb: 32% 38.4M/119M [00:06<00:11, 7.24MB/s]d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19620
+ Upload file pytorch_model.bin: 8% 93.5M/1.18G [00:08<01:51, 10.4MB/s] 51.2M/119M [00:08<00:10, 6.92MB/s]d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19621
+ Upload file pytorch_model.bin: 9% 113M/1.18G [00:10<01:51, 10.2MB/s]% 65.4M/119M [00:10<00:07, 7.15MB/s]d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19622
+ Upload file wandb/run-20220126_105847-1xdiy2kf/run-1xdiy2kf.wandb: 67% 79.8M/119M [00:12<00:05, 7.37MB/s]d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19623
+ Upload file pytorch_model.bin: 12% 147M/1.18G [00:14<01:59, 9.24MB/s]% 93.9M/119M [00:14<00:03, 7.41MB/s]d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19624
+ Upload file wandb/run-20220126_105847-1xdiy2kf/run-1xdiy2kf.wandb: 92% 109M/119M [00:16<00:01, 7.64MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19625
+ Upload file pytorch_model.bin: 15% 183M/1.18G [00:18<01:56, 9.22MB/s]% 118M/119M [00:17<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19626
+ Upload file pytorch_model.bin: 17% 202M/1.18G [00:20<01:46, 9.81MB/s]% 118M/119M [00:17<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19627
+ Upload file pytorch_model.bin: 18% 220M/1.18G [00:22<01:46, 9.67MB/s]% 118M/119M [00:17<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19628
+ Upload file pytorch_model.bin: 20% 241M/1.18G [00:24<01:39, 10.2MB/s]% 118M/119M [00:17<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19629
+ Upload file pytorch_model.bin: 22% 262M/1.18G [00:26<01:32, 10.6MB/s]% 118M/119M [00:17<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19630
+ Upload file pytorch_model.bin: 23% 274M/1.18G [00:27<01:28, 11.0MB/s]% 118M/119M [00:17<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19631
+ Upload file pytorch_model.bin: 24% 295M/1.18G [00:29<01:25, 11.2MB/s]% 118M/119M [00:17<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19632
+ Upload file pytorch_model.bin: 26% 310M/1.18G [00:31<01:36, 9.67MB/s]% 118M/119M [00:17<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19633
+ Upload file pytorch_model.bin: 27% 323M/1.18G [00:33<01:52, 8.18MB/s]% 118M/119M [00:17<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19634
+ Upload file wandb/run-20220126_105847-1xdiy2kf/run-1xdiy2kf.wandb: 100% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19635
+ Upload file pytorch_model.bin: 29% 353M/1.18G [00:37<01:55, 7.75MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19636
+ Upload file pytorch_model.bin: 31% 369M/1.18G [00:39<01:48, 8.06MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19637
+ Upload file pytorch_model.bin: 32% 384M/1.18G [00:41<01:46, 8.03MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19638
+ Upload file pytorch_model.bin: 33% 401M/1.18G [00:43<01:38, 8.55MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19639
+ Upload file pytorch_model.bin: 35% 423M/1.18G [00:45<01:21, 10.1MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19640
+ Upload file pytorch_model.bin: 37% 449M/1.18G [00:47<01:06, 11.9MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19641
+ Upload file pytorch_model.bin: 40% 486M/1.18G [00:49<00:47, 16.0MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19642
+ Upload file pytorch_model.bin: 44% 536M/1.18G [00:51<00:33, 21.0MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19643
+ Upload file pytorch_model.bin: 47% 571M/1.18G [00:53<00:33, 19.5MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19644
+ Upload file pytorch_model.bin: 50% 604M/1.18G [00:55<00:33, 18.6MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19645
+ Upload file pytorch_model.bin: 53% 634M/1.18G [00:57<00:35, 16.9MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19646
+ Upload file pytorch_model.bin: 55% 657M/1.18G [00:59<00:40, 14.1MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19647
+ Upload file pytorch_model.bin: 56% 680M/1.18G [01:01<00:41, 13.1MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19648
+ Upload file pytorch_model.bin: 58% 703M/1.18G [01:03<00:41, 12.7MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19649
+ Upload file pytorch_model.bin: 60% 720M/1.18G [01:05<00:48, 10.6MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19650
+ Upload file pytorch_model.bin: 61% 734M/1.18G [01:07<00:53, 9.22MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19651
+ Upload file pytorch_model.bin: 62% 750M/1.18G [01:09<00:55, 8.57MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19652
+ Upload file pytorch_model.bin: 63% 763M/1.18G [01:11<00:59, 7.72MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19653
+ Upload file pytorch_model.bin: 64% 776M/1.18G [01:13<01:01, 7.33MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19654
+ Upload file pytorch_model.bin: 66% 791M/1.18G [01:15<00:57, 7.53MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19655
+ Upload file pytorch_model.bin: 67% 806M/1.18G [01:17<00:53, 7.79MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19656
+ Upload file pytorch_model.bin: 68% 823M/1.18G [01:19<00:49, 8.14MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19657
+ Upload file pytorch_model.bin: 70% 839M/1.18G [01:21<00:46, 8.17MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19658
+ Upload file pytorch_model.bin: 71% 855M/1.18G [01:23<00:43, 8.46MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19659
+ Upload file pytorch_model.bin: 72% 866M/1.18G [01:25<00:50, 7.01MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19660
+ Upload file pytorch_model.bin: 73% 876M/1.18G [01:27<00:54, 6.27MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19661
+ Upload file pytorch_model.bin: 74% 887M/1.18G [01:29<00:55, 5.99MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19662
+ Upload file pytorch_model.bin: 75% 898M/1.18G [01:31<00:54, 5.83MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19663
+ Upload file pytorch_model.bin: 76% 910M/1.18G [01:33<00:50, 6.15MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19664
+ Upload file pytorch_model.bin: 77% 924M/1.18G [01:35<00:44, 6.65MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19665
+ Upload file pytorch_model.bin: 78% 940M/1.18G [01:37<00:36, 7.67MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19666
+ Upload file pytorch_model.bin: 79% 956M/1.18G [01:39<00:32, 8.00MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19667
+ Upload file pytorch_model.bin: 81% 975M/1.18G [01:41<00:26, 8.90MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19668
+ Upload file pytorch_model.bin: 83% 993M/1.18G [01:43<00:23, 9.37MB/s]% 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19669
+ Upload file pytorch_model.bin: 84% 0.98G/1.18G [01:45<00:24, 8.35MB/s] 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19670
+ Upload file pytorch_model.bin: 84% 0.99G/1.18G [01:47<00:31, 6.20MB/s] 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19671
+ Upload file pytorch_model.bin: 85% 1.00G/1.18G [01:49<00:32, 5.83MB/s] 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19672
+ Upload file pytorch_model.bin: 86% 1.01G/1.18G [01:51<00:34, 5.21MB/s] 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19673
+ Upload file pytorch_model.bin: 87% 1.02G/1.18G [01:53<00:33, 4.98MB/s] 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19674
+ Upload file pytorch_model.bin: 88% 1.03G/1.18G [01:55<00:28, 5.46MB/s] 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19675
+ Upload file pytorch_model.bin: 89% 1.04G/1.18G [01:57<00:24, 5.87MB/s] 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19676
+ Upload file pytorch_model.bin: 90% 1.06G/1.18G [01:59<00:16, 7.62MB/s] 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19677
+ Upload file pytorch_model.bin: 92% 1.08G/1.18G [02:01<00:09, 10.5MB/s] 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19678
+ Upload file pytorch_model.bin: 95% 1.12G/1.18G [02:03<00:04, 14.5MB/s] 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19679
+ Upload file pytorch_model.bin: 98% 1.15G/1.18G [02:05<00:01, 15.2MB/s] 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19680
+ Upload file pytorch_model.bin: 99% 1.16G/1.18G [02:07<00:00, 12.1MB/s] 119M/119M [00:35<00:00, 8.20MB/s] d` and have been ignored: input_length.orward` and have been ignored: input_length.h..
19681
+ error: failed to push some refs to 'https://huggingface.co/shpotes/xls-r-et'e: error: cannot lock ref 'refs/heads/main': is at fa2a9d24f0bae1b5002fb327d3cfa727ef5b4caf but expected 47349e7afe3432bdda0b555d40b9efb3c7b25724
19682
+ error: failed to push some refs to 'https://huggingface.co/shpotes/xls-r-et'e: error: cannot lock ref 'refs/heads/main': is at fa2a9d24f0bae1b5002fb327d3cfa727ef5b4caf but expected 47349e7afe3432bdda0b555d40b9efb3c7b25724
19683
+ 01/28/2022 11:57:53 - WARNING - huggingface_hub.repository - remote: error: cannot lock ref 'refs/heads/main': is at fa2a9d24f0bae1b5002fb327d3cfa727ef5b4caf but expected 47349e7afe3432bdda0b555d40b9efb3c7b25724
19684
+ To https://huggingface.co/shpotes/xls-r-et
19685
+ ! [remote rejected] main -> main (failed to update ref)
19686
+ error: failed to push some refs to 'https://huggingface.co/shpotes/xls-r-et'ae1b5002fb327d3cfa727ef5b4caf but expected 47349e7afe3432bdda0b555d40b9efb3c7b25724 but expected 47349e7afe3432bdda0b555d40b9efb3c7b25724
19687
+ error: failed to push some refs to 'https://huggingface.co/shpotes/xls-r-et'ae1b5002fb327d3cfa727ef5b4caf but expected 47349e7afe3432bdda0b555d40b9efb3c7b25724 but expected 47349e7afe3432bdda0b555d40b9efb3c7b25724
19688
+ error: failed to push some refs to 'https://huggingface.co/shpotes/xls-r-et'ae1b5002fb327d3cfa727ef5b4caf but expected 47349e7afe3432bdda0b555d40b9efb3c7b25724 but expected 47349e7afe3432bdda0b555d40b9efb3c7b25724
wandb/run-20220126_105847-1xdiy2kf/files/wandb-summary.json CHANGED
The diff for this file is too large to render. See raw diff
 
wandb/run-20220126_105847-1xdiy2kf/logs/debug-internal.log CHANGED
@@ -50347,3 +50347,216 @@ requests.exceptions.ReadTimeout: HTTPSConnectionPool(host='api.wandb.ai', port=4
50347
  2022-01-28 11:55:23,950 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: stop_status
50348
  2022-01-28 11:55:25,861 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50349
  2022-01-28 11:55:34,430 DEBUG SenderThread:2220828 [sender.py:send():234] send: stats
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
50347
  2022-01-28 11:55:23,950 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: stop_status
50348
  2022-01-28 11:55:25,861 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50349
  2022-01-28 11:55:34,430 DEBUG SenderThread:2220828 [sender.py:send():234] send: stats
50350
+ 2022-01-28 11:55:39,097 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: stop_status
50351
+ 2022-01-28 11:55:39,097 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: stop_status
50352
+ 2022-01-28 11:55:41,869 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50353
+ 2022-01-28 11:55:43,870 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50354
+ 2022-01-28 11:55:45,871 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50355
+ 2022-01-28 11:55:47,872 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50356
+ 2022-01-28 11:55:49,873 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50357
+ 2022-01-28 11:55:51,874 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50358
+ 2022-01-28 11:55:53,875 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50359
+ 2022-01-28 11:55:54,268 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: stop_status
50360
+ 2022-01-28 11:55:54,268 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: stop_status
50361
+ 2022-01-28 11:55:55,876 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50362
+ 2022-01-28 11:55:57,877 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50363
+ 2022-01-28 11:55:59,878 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50364
+ 2022-01-28 11:56:01,879 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50365
+ 2022-01-28 11:56:03,880 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50366
+ 2022-01-28 11:56:05,447 DEBUG SenderThread:2220828 [sender.py:send():234] send: stats
50367
+ 2022-01-28 11:56:05,881 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50368
+ 2022-01-28 11:56:07,882 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50369
+ 2022-01-28 11:56:09,422 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: stop_status
50370
+ 2022-01-28 11:56:09,423 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: stop_status
50371
+ 2022-01-28 11:56:09,883 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50372
+ 2022-01-28 11:56:11,884 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50373
+ 2022-01-28 11:56:14,885 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50374
+ 2022-01-28 11:56:16,886 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50375
+ 2022-01-28 11:56:18,887 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50376
+ 2022-01-28 11:56:20,889 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50377
+ 2022-01-28 11:56:22,889 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50378
+ 2022-01-28 11:56:24,576 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: stop_status
50379
+ 2022-01-28 11:56:24,576 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: stop_status
50380
+ 2022-01-28 11:56:24,891 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50381
+ 2022-01-28 11:56:26,891 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50382
+ 2022-01-28 11:56:28,892 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50383
+ 2022-01-28 11:56:30,893 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50384
+ 2022-01-28 11:56:32,894 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50385
+ 2022-01-28 11:56:34,895 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50386
+ 2022-01-28 11:56:36,472 DEBUG SenderThread:2220828 [sender.py:send():234] send: stats
50387
+ 2022-01-28 11:56:36,896 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50388
+ 2022-01-28 11:56:38,897 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50389
+ 2022-01-28 11:56:39,736 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: stop_status
50390
+ 2022-01-28 11:56:39,736 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: stop_status
50391
+ 2022-01-28 11:56:40,898 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50392
+ 2022-01-28 11:56:42,899 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50393
+ 2022-01-28 11:56:44,900 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50394
+ 2022-01-28 11:56:46,900 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50395
+ 2022-01-28 11:56:48,901 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50396
+ 2022-01-28 11:56:50,902 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50397
+ 2022-01-28 11:56:52,903 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50398
+ 2022-01-28 11:56:54,904 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50399
+ 2022-01-28 11:56:55,520 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: stop_status
50400
+ 2022-01-28 11:56:55,520 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: stop_status
50401
+ 2022-01-28 11:56:56,905 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50402
+ 2022-01-28 11:56:58,906 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50403
+ 2022-01-28 11:57:00,907 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50404
+ 2022-01-28 11:57:02,908 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50405
+ 2022-01-28 11:57:04,909 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50406
+ 2022-01-28 11:57:06,910 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50407
+ 2022-01-28 11:57:07,469 DEBUG SenderThread:2220828 [sender.py:send():234] send: stats
50408
+ 2022-01-28 11:57:08,911 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50409
+ 2022-01-28 11:57:10,670 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: stop_status
50410
+ 2022-01-28 11:57:10,671 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: stop_status
50411
+ 2022-01-28 11:57:10,912 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50412
+ 2022-01-28 11:57:12,913 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50413
+ 2022-01-28 11:57:14,914 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50414
+ 2022-01-28 11:57:16,915 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50415
+ 2022-01-28 11:57:18,916 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50416
+ 2022-01-28 11:57:20,917 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50417
+ 2022-01-28 11:57:22,917 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50418
+ 2022-01-28 11:57:24,919 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50419
+ 2022-01-28 11:57:25,823 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: stop_status
50420
+ 2022-01-28 11:57:25,823 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: stop_status
50421
+ 2022-01-28 11:57:26,920 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50422
+ 2022-01-28 11:57:28,920 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50423
+ 2022-01-28 11:57:30,921 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50424
+ 2022-01-28 11:57:32,922 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50425
+ 2022-01-28 11:57:34,923 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50426
+ 2022-01-28 11:57:36,924 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50427
+ 2022-01-28 11:57:38,484 DEBUG SenderThread:2220828 [sender.py:send():234] send: stats
50428
+ 2022-01-28 11:57:38,925 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50429
+ 2022-01-28 11:57:40,926 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50430
+ 2022-01-28 11:57:40,973 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: stop_status
50431
+ 2022-01-28 11:57:40,973 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: stop_status
50432
+ 2022-01-28 11:57:42,927 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50433
+ 2022-01-28 11:57:44,928 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50434
+ 2022-01-28 11:57:46,929 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50435
+ 2022-01-28 11:57:48,930 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50436
+ 2022-01-28 11:57:50,931 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50437
+ 2022-01-28 11:57:52,931 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50438
+ 2022-01-28 11:57:54,933 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50439
+ 2022-01-28 11:57:55,933 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50440
+ 2022-01-28 11:57:56,247 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: poll_exit
50441
+ 2022-01-28 11:57:56,248 DEBUG SenderThread:2220828 [sender.py:send():234] send: telemetry
50442
+ 2022-01-28 11:57:56,248 DEBUG SenderThread:2220828 [sender.py:send():234] send: exit
50443
+ 2022-01-28 11:57:56,248 INFO SenderThread:2220828 [sender.py:send_exit():366] handling exit code: 1
50444
+ 2022-01-28 11:57:56,249 INFO SenderThread:2220828 [sender.py:send_exit():368] handling runtime: 176347
50445
+ 2022-01-28 11:57:56,276 INFO SenderThread:2220828 [sender.py:_save_file():939] saving file wandb-summary.json with policy end
50446
+ 2022-01-28 11:57:56,277 INFO SenderThread:2220828 [sender.py:send_exit():374] send defer
50447
+ 2022-01-28 11:57:56,277 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: poll_exit
50448
+ 2022-01-28 11:57:56,278 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: defer
50449
+ 2022-01-28 11:57:56,278 INFO HandlerThread:2220828 [handler.py:handle_request_defer():147] handle defer: 0
50450
+ 2022-01-28 11:57:56,278 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: defer
50451
+ 2022-01-28 11:57:56,278 INFO SenderThread:2220828 [sender.py:send_request_defer():383] handle sender defer: 0
50452
+ 2022-01-28 11:57:56,278 INFO SenderThread:2220828 [sender.py:transition_state():387] send defer: 1
50453
+ 2022-01-28 11:57:56,279 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: defer
50454
+ 2022-01-28 11:57:56,279 INFO HandlerThread:2220828 [handler.py:handle_request_defer():147] handle defer: 1
50455
+ 2022-01-28 11:57:56,432 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: defer
50456
+ 2022-01-28 11:57:56,432 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: poll_exit
50457
+ 2022-01-28 11:57:56,432 INFO SenderThread:2220828 [sender.py:send_request_defer():383] handle sender defer: 1
50458
+ 2022-01-28 11:57:56,433 INFO SenderThread:2220828 [sender.py:transition_state():387] send defer: 2
50459
+ 2022-01-28 11:57:56,433 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: poll_exit
50460
+ 2022-01-28 11:57:56,434 DEBUG SenderThread:2220828 [sender.py:send():234] send: stats
50461
+ 2022-01-28 11:57:56,435 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: defer
50462
+ 2022-01-28 11:57:56,435 INFO HandlerThread:2220828 [handler.py:handle_request_defer():147] handle defer: 2
50463
+ 2022-01-28 11:57:56,435 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: defer
50464
+ 2022-01-28 11:57:56,436 INFO SenderThread:2220828 [sender.py:send_request_defer():383] handle sender defer: 2
50465
+ 2022-01-28 11:57:56,436 INFO SenderThread:2220828 [sender.py:transition_state():387] send defer: 3
50466
+ 2022-01-28 11:57:56,436 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: defer
50467
+ 2022-01-28 11:57:56,436 INFO HandlerThread:2220828 [handler.py:handle_request_defer():147] handle defer: 3
50468
+ 2022-01-28 11:57:56,463 DEBUG SenderThread:2220828 [sender.py:send():234] send: summary
50469
+ 2022-01-28 11:57:56,500 INFO SenderThread:2220828 [sender.py:_save_file():939] saving file wandb-summary.json with policy end
50470
+ 2022-01-28 11:57:56,500 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: defer
50471
+ 2022-01-28 11:57:56,500 INFO SenderThread:2220828 [sender.py:send_request_defer():383] handle sender defer: 3
50472
+ 2022-01-28 11:57:56,500 INFO SenderThread:2220828 [sender.py:transition_state():387] send defer: 4
50473
+ 2022-01-28 11:57:56,500 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: defer
50474
+ 2022-01-28 11:57:56,501 INFO HandlerThread:2220828 [handler.py:handle_request_defer():147] handle defer: 4
50475
+ 2022-01-28 11:57:56,501 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: defer
50476
+ 2022-01-28 11:57:56,501 INFO SenderThread:2220828 [sender.py:send_request_defer():383] handle sender defer: 4
50477
+ 2022-01-28 11:57:56,536 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: poll_exit
50478
+ 2022-01-28 11:57:56,985 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50479
+ 2022-01-28 11:57:56,996 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/wandb-summary.json
50480
+ 2022-01-28 11:57:57,060 INFO SenderThread:2220828 [sender.py:transition_state():387] send defer: 5
50481
+ 2022-01-28 11:57:57,060 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: poll_exit
50482
+ 2022-01-28 11:57:57,061 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: defer
50483
+ 2022-01-28 11:57:57,061 INFO HandlerThread:2220828 [handler.py:handle_request_defer():147] handle defer: 5
50484
+ 2022-01-28 11:57:57,061 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: defer
50485
+ 2022-01-28 11:57:57,061 INFO SenderThread:2220828 [sender.py:send_request_defer():383] handle sender defer: 5
50486
+ 2022-01-28 11:57:57,061 INFO SenderThread:2220828 [dir_watcher.py:finish():283] shutting down directory watcher
50487
+ 2022-01-28 11:57:57,162 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: poll_exit
50488
+ 2022-01-28 11:57:57,986 INFO Thread-8 :2220828 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/config.yaml
50489
+ 2022-01-28 11:57:57,987 INFO SenderThread:2220828 [dir_watcher.py:finish():313] scan: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files
50490
+ 2022-01-28 11:57:57,987 INFO SenderThread:2220828 [dir_watcher.py:finish():327] scan save: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/config.yaml config.yaml
50491
+ 2022-01-28 11:57:57,987 INFO SenderThread:2220828 [dir_watcher.py:finish():327] scan save: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/wandb-summary.json wandb-summary.json
50492
+ 2022-01-28 11:57:57,988 INFO SenderThread:2220828 [dir_watcher.py:finish():327] scan save: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/requirements.txt requirements.txt
50493
+ 2022-01-28 11:57:57,995 INFO SenderThread:2220828 [dir_watcher.py:finish():327] scan save: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/wandb-metadata.json wandb-metadata.json
50494
+ 2022-01-28 11:57:58,000 INFO SenderThread:2220828 [dir_watcher.py:finish():327] scan save: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log output.log
50495
+ 2022-01-28 11:57:58,000 INFO SenderThread:2220828 [sender.py:transition_state():387] send defer: 6
50496
+ 2022-01-28 11:57:58,001 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: poll_exit
50497
+ 2022-01-28 11:57:58,008 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: defer
50498
+ 2022-01-28 11:57:58,014 INFO HandlerThread:2220828 [handler.py:handle_request_defer():147] handle defer: 6
50499
+ 2022-01-28 11:57:58,014 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: defer
50500
+ 2022-01-28 11:57:58,015 INFO SenderThread:2220828 [sender.py:send_request_defer():383] handle sender defer: 6
50501
+ 2022-01-28 11:57:58,015 INFO SenderThread:2220828 [file_pusher.py:finish():177] shutting down file pusher
50502
+ 2022-01-28 11:57:58,104 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: poll_exit
50503
+ 2022-01-28 11:57:58,104 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: poll_exit
50504
+ 2022-01-28 11:57:58,207 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: poll_exit
50505
+ 2022-01-28 11:57:58,207 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: poll_exit
50506
+ 2022-01-28 11:57:58,309 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: poll_exit
50507
+ 2022-01-28 11:57:58,310 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: poll_exit
50508
+ 2022-01-28 11:57:58,412 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: poll_exit
50509
+ 2022-01-28 11:57:58,413 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: poll_exit
50510
+ 2022-01-28 11:57:58,515 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: poll_exit
50511
+ 2022-01-28 11:57:58,515 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: poll_exit
50512
+ 2022-01-28 11:57:58,618 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: poll_exit
50513
+ 2022-01-28 11:57:58,618 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: poll_exit
50514
+ 2022-01-28 11:57:58,630 INFO Thread-14 :2220828 [upload_job.py:push():137] Uploaded file /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/requirements.txt
50515
+ 2022-01-28 11:57:58,720 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: poll_exit
50516
+ 2022-01-28 11:57:58,721 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: poll_exit
50517
+ 2022-01-28 11:57:58,823 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: poll_exit
50518
+ 2022-01-28 11:57:58,823 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: poll_exit
50519
+ 2022-01-28 11:57:58,926 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: poll_exit
50520
+ 2022-01-28 11:57:58,926 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: poll_exit
50521
+ 2022-01-28 11:57:58,959 INFO Thread-13 :2220828 [upload_job.py:push():137] Uploaded file /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/wandb-summary.json
50522
+ 2022-01-28 11:57:59,017 INFO Thread-12 :2220828 [upload_job.py:push():137] Uploaded file /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/config.yaml
50523
+ 2022-01-28 11:57:59,029 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: poll_exit
50524
+ 2022-01-28 11:57:59,029 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: poll_exit
50525
+ 2022-01-28 11:57:59,131 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: poll_exit
50526
+ 2022-01-28 11:57:59,132 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: poll_exit
50527
+ 2022-01-28 11:57:59,170 INFO Thread-15 :2220828 [upload_job.py:push():137] Uploaded file /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/files/output.log
50528
+ 2022-01-28 11:57:59,234 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: poll_exit
50529
+ 2022-01-28 11:57:59,234 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: poll_exit
50530
+ 2022-01-28 11:57:59,337 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: poll_exit
50531
+ 2022-01-28 11:57:59,337 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: poll_exit
50532
+ 2022-01-28 11:57:59,371 INFO Thread-7 :2220828 [sender.py:transition_state():387] send defer: 7
50533
+ 2022-01-28 11:57:59,371 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: defer
50534
+ 2022-01-28 11:57:59,372 INFO HandlerThread:2220828 [handler.py:handle_request_defer():147] handle defer: 7
50535
+ 2022-01-28 11:57:59,372 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: defer
50536
+ 2022-01-28 11:57:59,372 INFO SenderThread:2220828 [sender.py:send_request_defer():383] handle sender defer: 7
50537
+ 2022-01-28 11:57:59,439 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: poll_exit
50538
+ 2022-01-28 11:58:00,216 INFO SenderThread:2220828 [sender.py:transition_state():387] send defer: 8
50539
+ 2022-01-28 11:58:00,217 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: poll_exit
50540
+ 2022-01-28 11:58:00,217 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: defer
50541
+ 2022-01-28 11:58:00,218 INFO HandlerThread:2220828 [handler.py:handle_request_defer():147] handle defer: 8
50542
+ 2022-01-28 11:58:00,218 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: defer
50543
+ 2022-01-28 11:58:00,218 INFO SenderThread:2220828 [sender.py:send_request_defer():383] handle sender defer: 8
50544
+ 2022-01-28 11:58:00,218 INFO SenderThread:2220828 [sender.py:transition_state():387] send defer: 9
50545
+ 2022-01-28 11:58:00,220 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: defer
50546
+ 2022-01-28 11:58:00,220 DEBUG SenderThread:2220828 [sender.py:send():234] send: final
50547
+ 2022-01-28 11:58:00,221 INFO HandlerThread:2220828 [handler.py:handle_request_defer():147] handle defer: 9
50548
+ 2022-01-28 11:58:00,221 DEBUG SenderThread:2220828 [sender.py:send():234] send: footer
50549
+ 2022-01-28 11:58:00,222 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: defer
50550
+ 2022-01-28 11:58:00,222 INFO SenderThread:2220828 [sender.py:send_request_defer():383] handle sender defer: 9
50551
+ 2022-01-28 11:58:00,320 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: poll_exit
50552
+ 2022-01-28 11:58:00,320 DEBUG SenderThread:2220828 [sender.py:send_request():248] send_request: poll_exit
50553
+ 2022-01-28 11:58:00,320 INFO SenderThread:2220828 [file_pusher.py:join():182] waiting for file pusher
50554
+ 2022-01-28 11:58:00,599 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: get_summary
50555
+ 2022-01-28 11:58:00,657 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: sampled_history
50556
+ 2022-01-28 11:58:00,662 DEBUG HandlerThread:2220828 [handler.py:handle_request():130] handle_request: shutdown
50557
+ 2022-01-28 11:58:00,663 INFO HandlerThread:2220828 [handler.py:finish():731] shutting down handler
50558
+ 2022-01-28 11:58:01,221 INFO WriterThread:2220828 [datastore.py:close():281] close: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/run-1xdiy2kf.wandb
50559
+ 2022-01-28 11:58:01,597 INFO SenderThread:2220828 [sender.py:finish():1070] shutting down sender
50560
+ 2022-01-28 11:58:01,597 INFO SenderThread:2220828 [file_pusher.py:finish():177] shutting down file pusher
50561
+ 2022-01-28 11:58:01,597 INFO SenderThread:2220828 [file_pusher.py:join():182] waiting for file pusher
50562
+ 2022-01-28 11:58:01,606 INFO MainThread:2220828 [internal.py:handle_exit():77] Internal process exited
wandb/run-20220126_105847-1xdiy2kf/logs/debug.log CHANGED
@@ -22,3 +22,165 @@ config: {}
22
  2022-01-26 10:58:48,541 INFO MainThread:2220463 [wandb_init.py:init():633] run started, returning control to user process
23
  2022-01-26 10:58:48,562 INFO MainThread:2220463 [wandb_run.py:_config_callback():956] config_cb None None {'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': 'float32', 'use_bfloat16': False, 'pruned_heads': {}, 'tie_word_embeddings': True, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'chunk_size_feed_forward': 0, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'architectures': ['Wav2Vec2ForPreTraining'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': 1, 'pad_token_id': 36, 'eos_token_id': 2, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': None, 'problem_type': None, '_name_or_path': 'facebook/wav2vec2-xls-r-300m', 'transformers_version': '4.16.0.dev0', 'feat_extract_dropout': 0.0, 'model_type': 'wav2vec2', 'num_feat_extract_layers': 7, 'hidden_size': 1024, 'feat_extract_norm': 'layer', 'feat_extract_activation': 'gelu', 'conv_dim': [512, 512, 512, 512, 512, 512, 512], 'conv_stride': [5, 2, 2, 2, 2, 2, 2], 'conv_kernel': [10, 3, 3, 3, 3, 2, 2], 'conv_bias': True, 'num_conv_pos_embeddings': 128, 'num_conv_pos_embedding_groups': 16, 'num_hidden_layers': 24, 'intermediate_size': 4096, 'hidden_act': 'gelu', 'num_attention_heads': 16, 'hidden_dropout': 0.0, 'attention_dropout': 0.0, 'activation_dropout': 0.0, 'feat_proj_dropout': 0.1, 'final_dropout': 0.0, 'layerdrop': 0.0, 'layer_norm_eps': 1e-05, 'initializer_range': 0.02, 'vocab_size': 39, 'do_stable_layer_norm': True, 'use_weighted_layer_sum': False, 'apply_spec_augment': True, 'mask_time_prob': 0.1, 'mask_time_length': 10, 'mask_time_min_masks': 2, 'mask_feature_prob': 0.0, 'mask_feature_length': 10, 'mask_feature_min_masks': 0, 'num_codevectors_per_group': 320, 'num_codevector_groups': 2, 'contrastive_logits_temperature': 0.1, 'feat_quantizer_dropout': 0.0, 'num_negatives': 100, 'codevector_dim': 768, 'proj_codevector_dim': 768, 'diversity_loss_weight': 0.1, 'ctc_loss_reduction': 'mean', 'ctc_zero_infinity': False, 'add_adapter': False, 'adapter_kernel_size': 3, 'adapter_stride': 2, 'num_adapter_layers': 3, 'output_hidden_size': 1024, 'classifier_proj_size': 256, 'tdnn_dim': [512, 512, 512, 512, 1500], 'tdnn_kernel': [5, 3, 3, 1, 1], 'tdnn_dilation': [1, 2, 3, 1, 1], 'xvector_output_dim': 512, 'output_dir': './', 'overwrite_output_dir': True, 'do_train': True, 'do_eval': True, 'do_predict': False, 'evaluation_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 80, 'per_device_eval_batch_size': 80, 'per_gpu_train_batch_size': 'None', 'per_gpu_eval_batch_size': 'None', 'gradient_accumulation_steps': 2, 'eval_accumulation_steps': 'None', 'learning_rate': 0.0003, 'weight_decay': 0.0, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 500.0, 'max_steps': -1, 'lr_scheduler_type': 'cosine', 'warmup_ratio': 0.0, 'warmup_steps': 500, 'log_level': -1, 'log_level_replica': -1, 'log_on_each_node': True, 'logging_dir': './runs/Jan26_10-56-56_ganymede.eafit.edu.co', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 100, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 500, 'save_total_limit': 1, 'save_on_each_node': False, 'no_cuda': False, 'seed': 42, 'bf16': False, 'fp16': True, 'fp16_opt_level': 'O1', 'half_precision_backend': 'amp', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': 'None', 'local_rank': -1, 'xpu_backend': 'None', 'tpu_num_cores': 'None', 'tpu_metrics_debug': False, 'debug': '[]', 'dataloader_drop_last': False, 'eval_steps': 500, 'dataloader_num_workers': 0, 'past_index': -1, 'run_name': 'cosine+drop_proj+low_specaugment-300M', 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': 'None', 'load_best_model_at_end': False, 'metric_for_best_model': 'None', 'greater_is_better': 'None', 'ignore_data_skip': False, 'sharded_ddp': '[]', 'deepspeed': 'None', 'label_smoothing_factor': 0.0, 'optim': 'adamw_hf', 'adafactor': False, 'group_by_length': True, 'length_column_name': 'input_length', 'report_to': "['wandb']", 'ddp_find_unused_parameters': 'None', 'ddp_bucket_cap_mb': 'None', 'dataloader_pin_memory': True, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': True, 'resume_from_checkpoint': 'None', 'hub_model_id': 'None', 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'gradient_checkpointing': True, 'fp16_backend': 'auto', 'push_to_hub_model_id': 'None', 'push_to_hub_organization': 'None', 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', '_n_gpu': 1, 'mp_parameters': '', 'train_batch_size': 80, 'eval_batch_size': 80}
24
  2022-01-26 10:58:48,565 INFO MainThread:2220463 [wandb_watch.py:watch():43] Watching
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
22
  2022-01-26 10:58:48,541 INFO MainThread:2220463 [wandb_init.py:init():633] run started, returning control to user process
23
  2022-01-26 10:58:48,562 INFO MainThread:2220463 [wandb_run.py:_config_callback():956] config_cb None None {'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': 'float32', 'use_bfloat16': False, 'pruned_heads': {}, 'tie_word_embeddings': True, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'chunk_size_feed_forward': 0, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'architectures': ['Wav2Vec2ForPreTraining'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': 1, 'pad_token_id': 36, 'eos_token_id': 2, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': None, 'problem_type': None, '_name_or_path': 'facebook/wav2vec2-xls-r-300m', 'transformers_version': '4.16.0.dev0', 'feat_extract_dropout': 0.0, 'model_type': 'wav2vec2', 'num_feat_extract_layers': 7, 'hidden_size': 1024, 'feat_extract_norm': 'layer', 'feat_extract_activation': 'gelu', 'conv_dim': [512, 512, 512, 512, 512, 512, 512], 'conv_stride': [5, 2, 2, 2, 2, 2, 2], 'conv_kernel': [10, 3, 3, 3, 3, 2, 2], 'conv_bias': True, 'num_conv_pos_embeddings': 128, 'num_conv_pos_embedding_groups': 16, 'num_hidden_layers': 24, 'intermediate_size': 4096, 'hidden_act': 'gelu', 'num_attention_heads': 16, 'hidden_dropout': 0.0, 'attention_dropout': 0.0, 'activation_dropout': 0.0, 'feat_proj_dropout': 0.1, 'final_dropout': 0.0, 'layerdrop': 0.0, 'layer_norm_eps': 1e-05, 'initializer_range': 0.02, 'vocab_size': 39, 'do_stable_layer_norm': True, 'use_weighted_layer_sum': False, 'apply_spec_augment': True, 'mask_time_prob': 0.1, 'mask_time_length': 10, 'mask_time_min_masks': 2, 'mask_feature_prob': 0.0, 'mask_feature_length': 10, 'mask_feature_min_masks': 0, 'num_codevectors_per_group': 320, 'num_codevector_groups': 2, 'contrastive_logits_temperature': 0.1, 'feat_quantizer_dropout': 0.0, 'num_negatives': 100, 'codevector_dim': 768, 'proj_codevector_dim': 768, 'diversity_loss_weight': 0.1, 'ctc_loss_reduction': 'mean', 'ctc_zero_infinity': False, 'add_adapter': False, 'adapter_kernel_size': 3, 'adapter_stride': 2, 'num_adapter_layers': 3, 'output_hidden_size': 1024, 'classifier_proj_size': 256, 'tdnn_dim': [512, 512, 512, 512, 1500], 'tdnn_kernel': [5, 3, 3, 1, 1], 'tdnn_dilation': [1, 2, 3, 1, 1], 'xvector_output_dim': 512, 'output_dir': './', 'overwrite_output_dir': True, 'do_train': True, 'do_eval': True, 'do_predict': False, 'evaluation_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 80, 'per_device_eval_batch_size': 80, 'per_gpu_train_batch_size': 'None', 'per_gpu_eval_batch_size': 'None', 'gradient_accumulation_steps': 2, 'eval_accumulation_steps': 'None', 'learning_rate': 0.0003, 'weight_decay': 0.0, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 500.0, 'max_steps': -1, 'lr_scheduler_type': 'cosine', 'warmup_ratio': 0.0, 'warmup_steps': 500, 'log_level': -1, 'log_level_replica': -1, 'log_on_each_node': True, 'logging_dir': './runs/Jan26_10-56-56_ganymede.eafit.edu.co', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 100, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 500, 'save_total_limit': 1, 'save_on_each_node': False, 'no_cuda': False, 'seed': 42, 'bf16': False, 'fp16': True, 'fp16_opt_level': 'O1', 'half_precision_backend': 'amp', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': 'None', 'local_rank': -1, 'xpu_backend': 'None', 'tpu_num_cores': 'None', 'tpu_metrics_debug': False, 'debug': '[]', 'dataloader_drop_last': False, 'eval_steps': 500, 'dataloader_num_workers': 0, 'past_index': -1, 'run_name': 'cosine+drop_proj+low_specaugment-300M', 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': 'None', 'load_best_model_at_end': False, 'metric_for_best_model': 'None', 'greater_is_better': 'None', 'ignore_data_skip': False, 'sharded_ddp': '[]', 'deepspeed': 'None', 'label_smoothing_factor': 0.0, 'optim': 'adamw_hf', 'adafactor': False, 'group_by_length': True, 'length_column_name': 'input_length', 'report_to': "['wandb']", 'ddp_find_unused_parameters': 'None', 'ddp_bucket_cap_mb': 'None', 'dataloader_pin_memory': True, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': True, 'resume_from_checkpoint': 'None', 'hub_model_id': 'None', 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'gradient_checkpointing': True, 'fp16_backend': 'auto', 'push_to_hub_model_id': 'None', 'push_to_hub_organization': 'None', 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', '_n_gpu': 1, 'mp_parameters': '', 'train_batch_size': 80, 'eval_batch_size': 80}
24
  2022-01-26 10:58:48,565 INFO MainThread:2220463 [wandb_watch.py:watch():43] Watching
25
+ 2022-01-28 11:57:53,891 INFO MainThread:2220463 [wandb_run.py:_atexit_cleanup():1780] got exitcode: 1
26
+ 2022-01-28 11:57:53,896 INFO MainThread:2220463 [wandb_run.py:_restore():1752] restore
27
+ 2022-01-28 11:57:56,278 INFO MainThread:2220463 [wandb_run.py:_wait_for_finish():1912] got exit ret: file_counts {
28
+ wandb_count: 1
29
+ }
30
+ pusher_stats {
31
+ uploaded_bytes: 2324
32
+ total_bytes: 2324
33
+ }
34
+
35
+ 2022-01-28 11:57:56,435 INFO MainThread:2220463 [wandb_run.py:_wait_for_finish():1912] got exit ret: file_counts {
36
+ wandb_count: 1
37
+ }
38
+ pusher_stats {
39
+ uploaded_bytes: 2324
40
+ total_bytes: 2324
41
+ }
42
+
43
+ 2022-01-28 11:57:57,061 INFO MainThread:2220463 [wandb_run.py:_wait_for_finish():1912] got exit ret: file_counts {
44
+ wandb_count: 1
45
+ }
46
+ pusher_stats {
47
+ uploaded_bytes: 2324
48
+ total_bytes: 2324
49
+ }
50
+
51
+ 2022-01-28 11:57:58,002 INFO MainThread:2220463 [wandb_run.py:_wait_for_finish():1912] got exit ret: file_counts {
52
+ wandb_count: 5
53
+ }
54
+ pusher_stats {
55
+ uploaded_bytes: 2324
56
+ total_bytes: 3441922
57
+ }
58
+
59
+ 2022-01-28 11:57:58,105 INFO MainThread:2220463 [wandb_run.py:_wait_for_finish():1912] got exit ret: file_counts {
60
+ wandb_count: 5
61
+ }
62
+ pusher_stats {
63
+ uploaded_bytes: 2324
64
+ total_bytes: 3441922
65
+ }
66
+
67
+ 2022-01-28 11:57:58,208 INFO MainThread:2220463 [wandb_run.py:_wait_for_finish():1912] got exit ret: file_counts {
68
+ wandb_count: 5
69
+ }
70
+ pusher_stats {
71
+ uploaded_bytes: 2324
72
+ total_bytes: 3441922
73
+ }
74
+
75
+ 2022-01-28 11:57:58,311 INFO MainThread:2220463 [wandb_run.py:_wait_for_finish():1912] got exit ret: file_counts {
76
+ wandb_count: 5
77
+ }
78
+ pusher_stats {
79
+ uploaded_bytes: 2246495
80
+ total_bytes: 3441922
81
+ }
82
+
83
+ 2022-01-28 11:57:58,414 INFO MainThread:2220463 [wandb_run.py:_wait_for_finish():1912] got exit ret: file_counts {
84
+ wandb_count: 5
85
+ }
86
+ pusher_stats {
87
+ uploaded_bytes: 2246495
88
+ total_bytes: 3441922
89
+ }
90
+
91
+ 2022-01-28 11:57:58,516 INFO MainThread:2220463 [wandb_run.py:_wait_for_finish():1912] got exit ret: file_counts {
92
+ wandb_count: 5
93
+ }
94
+ pusher_stats {
95
+ uploaded_bytes: 3441922
96
+ total_bytes: 3441922
97
+ }
98
+
99
+ 2022-01-28 11:57:58,619 INFO MainThread:2220463 [wandb_run.py:_wait_for_finish():1912] got exit ret: file_counts {
100
+ wandb_count: 5
101
+ }
102
+ pusher_stats {
103
+ uploaded_bytes: 3441922
104
+ total_bytes: 3441922
105
+ }
106
+
107
+ 2022-01-28 11:57:58,722 INFO MainThread:2220463 [wandb_run.py:_wait_for_finish():1912] got exit ret: file_counts {
108
+ wandb_count: 5
109
+ }
110
+ pusher_stats {
111
+ uploaded_bytes: 3441922
112
+ total_bytes: 3441922
113
+ }
114
+
115
+ 2022-01-28 11:57:58,824 INFO MainThread:2220463 [wandb_run.py:_wait_for_finish():1912] got exit ret: file_counts {
116
+ wandb_count: 5
117
+ }
118
+ pusher_stats {
119
+ uploaded_bytes: 3441922
120
+ total_bytes: 3441922
121
+ }
122
+
123
+ 2022-01-28 11:57:58,927 INFO MainThread:2220463 [wandb_run.py:_wait_for_finish():1912] got exit ret: file_counts {
124
+ wandb_count: 5
125
+ }
126
+ pusher_stats {
127
+ uploaded_bytes: 3441922
128
+ total_bytes: 3441922
129
+ }
130
+
131
+ 2022-01-28 11:57:59,030 INFO MainThread:2220463 [wandb_run.py:_wait_for_finish():1912] got exit ret: file_counts {
132
+ wandb_count: 5
133
+ }
134
+ pusher_stats {
135
+ uploaded_bytes: 3441922
136
+ total_bytes: 3441922
137
+ }
138
+
139
+ 2022-01-28 11:57:59,133 INFO MainThread:2220463 [wandb_run.py:_wait_for_finish():1912] got exit ret: file_counts {
140
+ wandb_count: 5
141
+ }
142
+ pusher_stats {
143
+ uploaded_bytes: 3441922
144
+ total_bytes: 3441922
145
+ }
146
+
147
+ 2022-01-28 11:57:59,235 INFO MainThread:2220463 [wandb_run.py:_wait_for_finish():1912] got exit ret: file_counts {
148
+ wandb_count: 5
149
+ }
150
+ pusher_stats {
151
+ uploaded_bytes: 3441922
152
+ total_bytes: 3441922
153
+ }
154
+
155
+ 2022-01-28 11:57:59,338 INFO MainThread:2220463 [wandb_run.py:_wait_for_finish():1912] got exit ret: file_counts {
156
+ wandb_count: 5
157
+ }
158
+ pusher_stats {
159
+ uploaded_bytes: 3441922
160
+ total_bytes: 3441922
161
+ }
162
+
163
+ 2022-01-28 11:58:00,218 INFO MainThread:2220463 [wandb_run.py:_wait_for_finish():1912] got exit ret: file_counts {
164
+ wandb_count: 5
165
+ }
166
+ pusher_stats {
167
+ uploaded_bytes: 3441922
168
+ total_bytes: 3441922
169
+ }
170
+
171
+ 2022-01-28 11:58:00,597 INFO MainThread:2220463 [wandb_run.py:_wait_for_finish():1912] got exit ret: done: true
172
+ exit_result {
173
+ }
174
+ file_counts {
175
+ wandb_count: 5
176
+ }
177
+ pusher_stats {
178
+ uploaded_bytes: 3441922
179
+ total_bytes: 3441922
180
+ }
181
+ local_info {
182
+ }
183
+
184
+ 2022-01-28 11:58:01,703 INFO MainThread:2220463 [wandb_run.py:_append_history():2130] rendering history
185
+ 2022-01-28 11:58:01,705 INFO MainThread:2220463 [wandb_run.py:_append_summary():2085] rendering summary
186
+ 2022-01-28 11:58:01,706 INFO MainThread:2220463 [wandb_run.py:_append_files():2180] logging synced files
wandb/run-20220126_105847-1xdiy2kf/run-1xdiy2kf.wandb CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b7e665cf3bd1d21f24efc603dcc4e99707b7439674c0638bb608c504f3187318
3
- size 124718462
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aee0b40e3c968e6e44cf387e6b28e8eb547361393a2c20aa51d507601ce6dd4f
3
+ size 125379374
wandb/run-20220129_111936-33z1cg4n/files/config.yaml ADDED
The diff for this file is too large to render. See raw diff
 
wandb/run-20220129_111936-33z1cg4n/files/output.log ADDED
@@ -0,0 +1,546 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+
3
+
4
+
5
+
6
+
7
+
8
+
9
+
10
+
11
+
12
+
13
+
14
+
15
+
16
+
17
+
18
+
19
+
20
+
21
+
22
+
23
+
24
+
25
+
26
+
27
+
28
+
29
+
30
+
31
+
32
+
33
+
34
+
35
+
36
+
37
+
38
+
39
+
40
+
41
+
42
+
43
+
44
+
45
+
46
+
47
+
48
+
49
+
50
+
51
+
52
+
53
+
54
+
55
+
56
+
57
+
58
+
59
+
60
+
61
+
62
+
63
+
64
+
65
+
66
+
67
+
68
+
69
+
70
+
71
+
72
+
73
+
74
+
75
+
76
+
77
+
78
+
79
+
80
+
81
+
82
+
83
+
84
+
85
+
86
+
87
+
88
+
89
+
90
+
91
+
92
+
93
+
94
+
95
+
96
+
97
+
98
+
99
+
100
+
101
+ 3%|█▋ | 99/3600 [15:46<10:30:00, 10.80s/it]
102
+
103
+
104
+
105
+
106
+
107
+
108
+
109
+
110
+
111
+
112
+
113
+
114
+
115
+
116
+
117
+
118
+
119
+
120
+
121
+
122
+
123
+
124
+
125
+
126
+
127
+
128
+
129
+
130
+
131
+
132
+
133
+
134
+
135
+
136
+
137
+
138
+
139
+
140
+
141
+
142
+
143
+
144
+
145
+
146
+
147
+
148
+
149
+
150
+
151
+
152
+
153
+
154
+
155
+
156
+
157
+
158
+
159
+
160
+
161
+
162
+
163
+
164
+
165
+
166
+
167
+
168
+
169
+
170
+
171
+
172
+
173
+
174
+
175
+
176
+
177
+
178
+
179
+
180
+
181
+
182
+
183
+
184
+
185
+
186
+
187
+
188
+
189
+
190
+
191
+
192
+
193
+
194
+
195
+
196
+
197
+
198
+
199
+
200
+
201
+
202
+
203
+ 6%|███▍ | 200/3600 [31:33<10:03:22, 10.65s/it]
204
+
205
+
206
+
207
+
208
+
209
+
210
+
211
+
212
+
213
+
214
+
215
+
216
+
217
+
218
+
219
+
220
+
221
+
222
+
223
+
224
+
225
+
226
+
227
+
228
+
229
+
230
+
231
+
232
+
233
+
234
+
235
+
236
+
237
+
238
+
239
+
240
+
241
+
242
+
243
+
244
+
245
+
246
+
247
+
248
+
249
+
250
+
251
+
252
+
253
+
254
+
255
+
256
+
257
+
258
+
259
+
260
+
261
+
262
+
263
+
264
+
265
+
266
+
267
+
268
+
269
+
270
+
271
+
272
+
273
+
274
+
275
+
276
+
277
+
278
+
279
+
280
+
281
+
282
+
283
+
284
+
285
+
286
+
287
+
288
+
289
+
290
+
291
+
292
+
293
+
294
+
295
+
296
+
297
+
298
+
299
+
300
+
301
+
302
+
303
+ 8%|█████▏ | 299/3600 [47:03<9:53:18, 10.78s/it]
304
+
305
+
306
+
307
+
308
+
309
+
310
+
311
+
312
+
313
+
314
+
315
+
316
+
317
+
318
+
319
+
320
+
321
+
322
+
323
+
324
+
325
+
326
+
327
+
328
+
329
+
330
+
331
+
332
+
333
+
334
+
335
+
336
+
337
+
338
+
339
+
340
+
341
+
342
+
343
+
344
+
345
+
346
+
347
+
348
+
349
+
350
+
351
+
352
+
353
+
354
+
355
+
356
+
357
+
358
+
359
+
360
+
361
+
362
+
363
+
364
+
365
+
366
+
367
+
368
+
369
+
370
+
371
+
372
+
373
+
374
+
375
+
376
+
377
+
378
+
379
+
380
+
381
+
382
+
383
+
384
+
385
+
386
+
387
+
388
+
389
+
390
+
391
+
392
+
393
+
394
+
395
+
396
+
397
+
398
+
399
+
400
+
401
+
402
+
403
+
404
+ 11%|██████▋ | 399/3600 [1:02:40<9:47:13, 11.01s/it]
405
+
406
+
407
+
408
+
409
+
410
+
411
+
412
+
413
+
414
+
415
+
416
+
417
+
418
+
419
+
420
+
421
+
422
+
423
+
424
+
425
+
426
+
427
+
428
+
429
+
430
+
431
+
432
+
433
+
434
+
435
+
436
+
437
+
438
+
439
+
440
+
441
+
442
+
443
+
444
+
445
+
446
+
447
+
448
+
449
+
450
+
451
+
452
+
453
+
454
+
455
+
456
+
457
+
458
+
459
+
460
+
461
+
462
+
463
+
464
+
465
+
466
+
467
+
468
+
469
+
470
+
471
+
472
+
473
+
474
+
475
+
476
+
477
+
478
+
479
+
480
+
481
+
482
+
483
+
484
+
485
+
486
+
487
+
488
+
489
+
490
+
491
+
492
+
493
+
494
+
495
+
496
+
497
+
498
+
499
+
500
+
501
+
502
+
503
+
504
+
505
+ 14%|████████▎ | 499/3600 [1:18:15<6:47:48, 7.89s/it]
506
+ 14%|████████▎ | 500/3600 [1:18:20<5:57:31, 6.92s/it]The following columns in the evaluation set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.
507
+ ***** Running Evaluation *****
508
+ Num examples = 2609
509
+ Batch size = 80
510
+
511
+
512
+
513
+
514
+
515
+
516
+
517
+
518
+
519
+
520
+
521
+
522
+
523
+
524
+
525
+
526
+
527
+
528
+
529
+
530
+
531
+
532
+
533
+
534
+
535
+
536
+
537
+
538
+
539
+
540
+
541
+
542
+ 100%|███████████████████████████████████████████████████████████████████| 33/33 [02:06<00:00, 2.59s/it]
543
+
544
+ Configuration saved in ./checkpoint-500/config.json
545
+ Model weights saved in ./checkpoint-500/pytorch_model.bin
546
+ Configuration saved in ./checkpoint-500/preprocessor_config.json
wandb/run-20220129_111936-33z1cg4n/files/requirements.txt ADDED
@@ -0,0 +1,87 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ aiohttp==3.8.1
2
+ aiosignal==1.2.0
3
+ appdirs==1.4.4
4
+ async-timeout==4.0.2
5
+ attrs==21.4.0
6
+ audioread==2.1.9
7
+ bitsandbytes-cuda113==0.26.0
8
+ certifi==2021.10.8
9
+ cffi==1.15.0
10
+ charset-normalizer==2.0.10
11
+ click==8.0.3
12
+ clldutils==3.10.1
13
+ colorlog==6.6.0
14
+ configparser==5.2.0
15
+ csvw==1.11.0
16
+ datasets==1.18.1.dev0
17
+ decorator==5.1.1
18
+ dill==0.3.4
19
+ dlinfo==1.2.1
20
+ docker-pycreds==0.4.0
21
+ filelock==3.4.2
22
+ frozenlist==1.3.0
23
+ fsspec==2022.1.0
24
+ gitdb==4.0.9
25
+ gitpython==3.1.26
26
+ huggingface-hub==0.4.0
27
+ hypothesis==6.36.0
28
+ idna==3.3
29
+ isodate==0.6.1
30
+ jiwer==2.3.0
31
+ joblib==1.1.0
32
+ librosa==0.8.1
33
+ llvmlite==0.38.0
34
+ multidict==6.0.2
35
+ multiprocess==0.70.12.2
36
+ numba==0.55.0
37
+ numpy==1.21.5
38
+ packaging==21.3
39
+ pandas==1.4.0
40
+ pathtools==0.1.2
41
+ phonemizer==3.0.1
42
+ pip==21.3.1
43
+ pooch==1.6.0
44
+ promise==2.3
45
+ protobuf==3.19.3
46
+ psutil==5.9.0
47
+ pyarrow==6.0.1
48
+ pycparser==2.21
49
+ pyctcdecode==0.3.0
50
+ pygtrie==2.4.2
51
+ pyparsing==3.0.7
52
+ python-dateutil==2.8.2
53
+ python-levenshtein==0.12.2
54
+ pytz==2021.3
55
+ pyyaml==6.0
56
+ regex==2022.1.18
57
+ requests==2.27.1
58
+ resampy==0.2.2
59
+ rfc3986==2.0.0
60
+ sacremoses==0.0.47
61
+ scikit-learn==1.0.2
62
+ scipy==1.7.3
63
+ segments==2.2.0
64
+ sentry-sdk==1.5.4
65
+ setuptools==60.2.0
66
+ shortuuid==1.0.8
67
+ six==1.16.0
68
+ smmap==5.0.0
69
+ sortedcontainers==2.4.0
70
+ soundfile==0.10.3.post1
71
+ subprocess32==3.5.4
72
+ tabulate==0.8.9
73
+ termcolor==1.1.0
74
+ threadpoolctl==3.0.0
75
+ tokenizers==0.11.4
76
+ torch==1.10.1
77
+ torchaudio==0.10.1
78
+ tqdm==4.62.3
79
+ transformers==4.16.0.dev0
80
+ typing-extensions==4.0.1
81
+ uritemplate==4.1.1
82
+ urllib3==1.26.8
83
+ wandb==0.12.9
84
+ wheel==0.37.1
85
+ xxhash==2.0.2
86
+ yarl==1.7.2
87
+ yaspin==2.1.0
wandb/run-20220129_111936-33z1cg4n/files/wandb-metadata.json ADDED
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-4.18.0-305.10.2.el8_4.x86_64-x86_64-with-glibc2.28",
3
+ "python": "3.9.6",
4
+ "heartbeatAt": "2022-01-29T16:19:37.625823",
5
+ "startedAt": "2022-01-29T16:19:36.629047",
6
+ "docker": null,
7
+ "gpu": "Tesla V100-PCIE-32GB",
8
+ "gpu_count": 3,
9
+ "cpu_count": 64,
10
+ "cuda": null,
11
+ "args": [
12
+ "--dataset_name=mozilla-foundation/common_voice_7_0",
13
+ "--model_name_or_path=facebook/wav2vec2-xls-r-300m",
14
+ "--dataset_config_name=et",
15
+ "--output_dir=./",
16
+ "--overwrite_output_dir",
17
+ "--num_train_epochs=100",
18
+ "--per_device_train_batch_size=80",
19
+ "--per_device_eval_batch_size=80",
20
+ "--gradient_accumulation_steps=2",
21
+ "--learning_rate=3e-4",
22
+ "--save_total_limit=1",
23
+ "--warmup_steps=500",
24
+ "--evaluation_strategy=steps",
25
+ "--text_column_name=sentence",
26
+ "--length_column_name=input_length",
27
+ "--save_steps=500",
28
+ "--eval_steps=500",
29
+ "--logging_steps=100",
30
+ "--layerdrop=0.0",
31
+ "--freeze_feature_encoder",
32
+ "--feat_proj_dropout=0.1",
33
+ "--chars_to_ignore",
34
+ ",",
35
+ "?",
36
+ ".",
37
+ "!",
38
+ "-",
39
+ ";",
40
+ ":",
41
+ "\"",
42
+ "\u201c",
43
+ "%",
44
+ "\u2018",
45
+ "\u201d",
46
+ "\ufffd",
47
+ "\u2014",
48
+ "\u2019",
49
+ "\u2026",
50
+ "\u2013",
51
+ "--gradient_checkpointing",
52
+ "--lr_scheduler_type=cosine",
53
+ "--fp16",
54
+ "--group_by_length",
55
+ "--mask_time_prob=0.1",
56
+ "--mask_time_length=10",
57
+ "--report_to=wandb",
58
+ "--run_name=cosine+drop_proj+low_specaugment-300M",
59
+ "--do_train",
60
+ "--do_eval",
61
+ "--use_auth_token",
62
+ "--push_to_hub"
63
+ ],
64
+ "state": "running",
65
+ "program": "/home/sagrilaft/Project/audio/xls-r-et/src/run_speech_recognition_ctc_bnb.py",
66
+ "codePath": "src/run_speech_recognition_ctc_bnb.py",
67
+ "git": {
68
+ "remote": "https://huggingface.co/shpotes/xls-r-et",
69
+ "commit": "fa2a9d24f0bae1b5002fb327d3cfa727ef5b4caf"
70
+ },
71
+ "email": "shpotes3@gmail.com",
72
+ "root": "/home/sagrilaft/Project/audio/xls-r-et",
73
+ "host": "ganymede.eafit.edu.co",
74
+ "username": "sagrilaft",
75
+ "executable": "/home/sagrilaft/Project/audio/xls-r-et/.venv/bin/python"
76
+ }
wandb/run-20220129_111936-33z1cg4n/files/wandb-summary.json ADDED
The diff for this file is too large to render. See raw diff
 
wandb/run-20220129_111936-33z1cg4n/logs/debug-internal.log ADDED
The diff for this file is too large to render. See raw diff
 
wandb/run-20220129_111936-33z1cg4n/logs/debug.log ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2022-01-29 11:19:36,632 INFO MainThread:2523114 [wandb_setup.py:_flush():71] setting env: {'project': 'xls-r-estonian'}
2
+ 2022-01-29 11:19:36,632 INFO MainThread:2523114 [wandb_setup.py:_flush():71] setting login settings: {}
3
+ 2022-01-29 11:19:36,632 INFO MainThread:2523114 [wandb_init.py:_log_setup():371] Logging user logs to /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220129_111936-33z1cg4n/logs/debug.log
4
+ 2022-01-29 11:19:36,632 INFO MainThread:2523114 [wandb_init.py:_log_setup():372] Logging internal logs to /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220129_111936-33z1cg4n/logs/debug-internal.log
5
+ 2022-01-29 11:19:36,633 INFO MainThread:2523114 [wandb_init.py:init():404] calling init triggers
6
+ 2022-01-29 11:19:36,633 INFO MainThread:2523114 [wandb_init.py:init():409] wandb.init called with sweep_config: {}
7
+ config: {}
8
+ 2022-01-29 11:19:36,633 INFO MainThread:2523114 [wandb_init.py:init():460] starting backend
9
+ 2022-01-29 11:19:36,633 INFO MainThread:2523114 [backend.py:_multiprocessing_setup():99] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
10
+ 2022-01-29 11:19:36,666 INFO MainThread:2523114 [backend.py:ensure_launched():216] starting backend process...
11
+ 2022-01-29 11:19:36,693 INFO MainThread:2523114 [backend.py:ensure_launched():221] started backend process with pid: 2523574
12
+ 2022-01-29 11:19:36,694 INFO MainThread:2523114 [wandb_init.py:init():469] backend started and connected
13
+ 2022-01-29 11:19:36,701 INFO MainThread:2523114 [wandb_init.py:init():533] updated telemetry
14
+ 2022-01-29 11:19:36,765 INFO MainThread:2523114 [wandb_init.py:init():563] communicating current version
15
+ 2022-01-29 11:19:37,425 INFO MainThread:2523114 [wandb_init.py:init():568] got version response
16
+ 2022-01-29 11:19:37,426 INFO MainThread:2523114 [wandb_init.py:init():578] communicating run to backend with 30 second timeout
17
+ 2022-01-29 11:19:37,617 INFO MainThread:2523114 [wandb_init.py:init():606] starting run threads in backend
18
+ 2022-01-29 11:19:37,676 INFO MainThread:2523114 [wandb_run.py:_console_start():1810] atexit reg
19
+ 2022-01-29 11:19:37,677 INFO MainThread:2523114 [wandb_run.py:_redirect():1684] redirect: SettingsConsole.REDIRECT
20
+ 2022-01-29 11:19:37,677 INFO MainThread:2523114 [wandb_run.py:_redirect():1689] Redirecting console.
21
+ 2022-01-29 11:19:37,680 INFO MainThread:2523114 [wandb_run.py:_redirect():1745] Redirects installed.
22
+ 2022-01-29 11:19:37,680 INFO MainThread:2523114 [wandb_init.py:init():633] run started, returning control to user process
23
+ 2022-01-29 11:19:37,694 INFO MainThread:2523114 [wandb_run.py:_config_callback():956] config_cb None None {'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': 'float32', 'use_bfloat16': False, 'pruned_heads': {}, 'tie_word_embeddings': True, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'chunk_size_feed_forward': 0, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'architectures': ['Wav2Vec2ForPreTraining'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': 1, 'pad_token_id': 36, 'eos_token_id': 2, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': None, 'problem_type': None, '_name_or_path': 'facebook/wav2vec2-xls-r-300m', 'transformers_version': '4.16.0.dev0', 'feat_extract_dropout': 0.0, 'model_type': 'wav2vec2', 'num_feat_extract_layers': 7, 'hidden_size': 1024, 'feat_extract_norm': 'layer', 'feat_extract_activation': 'gelu', 'conv_dim': [512, 512, 512, 512, 512, 512, 512], 'conv_stride': [5, 2, 2, 2, 2, 2, 2], 'conv_kernel': [10, 3, 3, 3, 3, 2, 2], 'conv_bias': True, 'num_conv_pos_embeddings': 128, 'num_conv_pos_embedding_groups': 16, 'num_hidden_layers': 24, 'intermediate_size': 4096, 'hidden_act': 'gelu', 'num_attention_heads': 16, 'hidden_dropout': 0.0, 'attention_dropout': 0.0, 'activation_dropout': 0.0, 'feat_proj_dropout': 0.1, 'final_dropout': 0.0, 'layerdrop': 0.0, 'layer_norm_eps': 1e-05, 'initializer_range': 0.02, 'vocab_size': 39, 'do_stable_layer_norm': True, 'use_weighted_layer_sum': False, 'apply_spec_augment': True, 'mask_time_prob': 0.1, 'mask_time_length': 10, 'mask_time_min_masks': 2, 'mask_feature_prob': 0.0, 'mask_feature_length': 10, 'mask_feature_min_masks': 0, 'num_codevectors_per_group': 320, 'num_codevector_groups': 2, 'contrastive_logits_temperature': 0.1, 'feat_quantizer_dropout': 0.0, 'num_negatives': 100, 'codevector_dim': 768, 'proj_codevector_dim': 768, 'diversity_loss_weight': 0.1, 'ctc_loss_reduction': 'mean', 'ctc_zero_infinity': False, 'add_adapter': False, 'adapter_kernel_size': 3, 'adapter_stride': 2, 'num_adapter_layers': 3, 'output_hidden_size': 1024, 'classifier_proj_size': 256, 'tdnn_dim': [512, 512, 512, 512, 1500], 'tdnn_kernel': [5, 3, 3, 1, 1], 'tdnn_dilation': [1, 2, 3, 1, 1], 'xvector_output_dim': 512, 'output_dir': './', 'overwrite_output_dir': True, 'do_train': True, 'do_eval': True, 'do_predict': False, 'evaluation_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 80, 'per_device_eval_batch_size': 80, 'per_gpu_train_batch_size': 'None', 'per_gpu_eval_batch_size': 'None', 'gradient_accumulation_steps': 2, 'eval_accumulation_steps': 'None', 'learning_rate': 0.0003, 'weight_decay': 0.0, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 100.0, 'max_steps': -1, 'lr_scheduler_type': 'cosine', 'warmup_ratio': 0.0, 'warmup_steps': 500, 'log_level': -1, 'log_level_replica': -1, 'log_on_each_node': True, 'logging_dir': './runs/Jan29_11-17-08_ganymede.eafit.edu.co', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 100, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 500, 'save_total_limit': 1, 'save_on_each_node': False, 'no_cuda': False, 'seed': 42, 'bf16': False, 'fp16': True, 'fp16_opt_level': 'O1', 'half_precision_backend': 'amp', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': 'None', 'local_rank': -1, 'xpu_backend': 'None', 'tpu_num_cores': 'None', 'tpu_metrics_debug': False, 'debug': '[]', 'dataloader_drop_last': False, 'eval_steps': 500, 'dataloader_num_workers': 0, 'past_index': -1, 'run_name': 'cosine+drop_proj+low_specaugment-300M', 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': 'None', 'load_best_model_at_end': False, 'metric_for_best_model': 'None', 'greater_is_better': 'None', 'ignore_data_skip': False, 'sharded_ddp': '[]', 'deepspeed': 'None', 'label_smoothing_factor': 0.0, 'optim': 'adamw_hf', 'adafactor': False, 'group_by_length': True, 'length_column_name': 'input_length', 'report_to': "['wandb']", 'ddp_find_unused_parameters': 'None', 'ddp_bucket_cap_mb': 'None', 'dataloader_pin_memory': True, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': True, 'resume_from_checkpoint': 'None', 'hub_model_id': 'None', 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'gradient_checkpointing': True, 'fp16_backend': 'auto', 'push_to_hub_model_id': 'None', 'push_to_hub_organization': 'None', 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', '_n_gpu': 1, 'mp_parameters': '', 'train_batch_size': 80, 'eval_batch_size': 80}
24
+ 2022-01-29 11:19:37,697 INFO MainThread:2523114 [wandb_watch.py:watch():43] Watching
wandb/run-20220129_111936-33z1cg4n/run-33z1cg4n.wandb ADDED
Binary file (3.52 MB). View file