ayameRushia commited on
Commit
8543a98
1 Parent(s): dc39b02

Training in progress, step 500

Browse files
.ipynb_checkpoints/run-checkpoint.sh CHANGED
@@ -4,11 +4,11 @@ python run_speech_recognition_ctc.py \
4
  --dataset_config_name="el" \
5
  --output_dir="./" \
6
  --overwrite_output_dir \
7
- --num_train_epochs="40" \
8
  --per_device_train_batch_size="32" \
9
  --gradient_accumulation_steps="2" \
10
  --learning_rate="5e-5" \
11
- --warmup_steps="1000" \
12
  --lr_scheduler_type="linear" \
13
  --feat_proj_dropout="0.1" \
14
  --attention_dropout="0.1" \
@@ -18,8 +18,8 @@ python run_speech_recognition_ctc.py \
18
  --evaluation_strategy="steps" \
19
  --text_column_name="sentence" \
20
  --length_column_name="input_length" \
21
- --save_steps="1000" \
22
- --eval_steps="400" \
23
  --layerdrop="0.0" \
24
  --save_total_limit="2" \
25
  --freeze_feature_encoder \
 
4
  --dataset_config_name="el" \
5
  --output_dir="./" \
6
  --overwrite_output_dir \
7
+ --num_train_epochs="80" \
8
  --per_device_train_batch_size="32" \
9
  --gradient_accumulation_steps="2" \
10
  --learning_rate="5e-5" \
11
+ --warmup_steps="400" \
12
  --lr_scheduler_type="linear" \
13
  --feat_proj_dropout="0.1" \
14
  --attention_dropout="0.1" \
 
18
  --evaluation_strategy="steps" \
19
  --text_column_name="sentence" \
20
  --length_column_name="input_length" \
21
+ --save_steps="500" \
22
+ --eval_steps="500" \
23
  --layerdrop="0.0" \
24
  --save_total_limit="2" \
25
  --freeze_feature_encoder \
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0f5416c25274021c86ac8b1598fd021bfae47e384c96367caf69013bad81241f
3
  size 1262132785
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fbcdd6e77557731974267ab6f87f16eb50dc8e354267250c951df02997cc6db0
3
  size 1262132785
run.sh CHANGED
@@ -4,7 +4,7 @@ python run_speech_recognition_ctc.py \
4
  --dataset_config_name="el" \
5
  --output_dir="./" \
6
  --overwrite_output_dir \
7
- --num_train_epochs="40" \
8
  --per_device_train_batch_size="32" \
9
  --gradient_accumulation_steps="2" \
10
  --learning_rate="5e-5" \
@@ -18,8 +18,8 @@ python run_speech_recognition_ctc.py \
18
  --evaluation_strategy="steps" \
19
  --text_column_name="sentence" \
20
  --length_column_name="input_length" \
21
- --save_steps="1000" \
22
- --eval_steps="400" \
23
  --layerdrop="0.0" \
24
  --save_total_limit="2" \
25
  --freeze_feature_encoder \
 
4
  --dataset_config_name="el" \
5
  --output_dir="./" \
6
  --overwrite_output_dir \
7
+ --num_train_epochs="80" \
8
  --per_device_train_batch_size="32" \
9
  --gradient_accumulation_steps="2" \
10
  --learning_rate="5e-5" \
 
18
  --evaluation_strategy="steps" \
19
  --text_column_name="sentence" \
20
  --length_column_name="input_length" \
21
+ --save_steps="500" \
22
+ --eval_steps="500" \
23
  --layerdrop="0.0" \
24
  --save_total_limit="2" \
25
  --freeze_feature_encoder \
special_tokens_map.json CHANGED
@@ -1 +1 @@
1
- {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]", "additional_special_tokens": [{"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}]}
 
1
+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]", "additional_special_tokens": [{"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}]}
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:319739be0b8c57a290a35449f4033858ca110fe3f2f3563987386ce1d776afec
3
  size 2991
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cdb010419a9871a35ab482d0abfa3068a8f870c9ba360d2ea0173560ab60642
3
  size 2991
wandb/debug-internal.log CHANGED
@@ -1 +1 @@
1
- run-20220204_152118-2dc06ifr/logs/debug-internal.log
 
1
+ run-20220204_170031-gzsqxey3/logs/debug-internal.log
wandb/debug.log CHANGED
@@ -1 +1 @@
1
- run-20220204_152118-2dc06ifr/logs/debug.log
 
1
+ run-20220204_170031-gzsqxey3/logs/debug.log
wandb/latest-run CHANGED
@@ -1 +1 @@
1
- run-20220204_152118-2dc06ifr
 
1
+ run-20220204_170031-gzsqxey3
wandb/run-20220204_152118-2dc06ifr/files/output.log CHANGED
@@ -2129,3 +2129,13 @@ Configuration saved in ./preprocessor_config.json
2129
  Configuration saved in ./checkpoint-2000/config.json
2130
  Model weights saved in ./checkpoint-2000/pytorch_model.bin
2131
  Configuration saved in ./checkpoint-2000/preprocessor_config.json
 
 
 
 
 
 
 
 
 
 
 
2129
  Configuration saved in ./checkpoint-2000/config.json
2130
  Model weights saved in ./checkpoint-2000/pytorch_model.bin
2131
  Configuration saved in ./checkpoint-2000/preprocessor_config.json
2132
+ Configuration saved in ./preprocessor_config.json
2133
+
2134
+
2135
+
2136
+
2137
+
2138
+
2139
+
2140
+
2141
+
wandb/run-20220204_152118-2dc06ifr/logs/debug-internal.log CHANGED
@@ -4337,3 +4337,38 @@
4337
  2022-02-04 16:58:14,679 DEBUG SenderThread:583863 [sender.py:send_request():248] send_request: stop_status
4338
  2022-02-04 16:58:29,844 DEBUG HandlerThread:583863 [handler.py:handle_request():130] handle_request: stop_status
4339
  2022-02-04 16:58:29,845 DEBUG SenderThread:583863 [sender.py:send_request():248] send_request: stop_status
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4337
  2022-02-04 16:58:14,679 DEBUG SenderThread:583863 [sender.py:send_request():248] send_request: stop_status
4338
  2022-02-04 16:58:29,844 DEBUG HandlerThread:583863 [handler.py:handle_request():130] handle_request: stop_status
4339
  2022-02-04 16:58:29,845 DEBUG SenderThread:583863 [sender.py:send_request():248] send_request: stop_status
4340
+ 2022-02-04 16:58:38,298 INFO Thread-8 :583863 [dir_watcher.py:_on_file_modified():230] file/dir modified: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/output.log
4341
+ 2022-02-04 16:58:39,288 DEBUG SenderThread:583863 [sender.py:send():234] send: stats
4342
+ 2022-02-04 16:58:41,300 INFO Thread-8 :583863 [dir_watcher.py:_on_file_modified():230] file/dir modified: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/output.log
4343
+ 2022-02-04 16:58:43,303 INFO Thread-8 :583863 [dir_watcher.py:_on_file_modified():230] file/dir modified: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/output.log
4344
+ 2022-02-04 16:58:45,015 DEBUG HandlerThread:583863 [handler.py:handle_request():130] handle_request: stop_status
4345
+ 2022-02-04 16:58:45,015 DEBUG SenderThread:583863 [sender.py:send_request():248] send_request: stop_status
4346
+ 2022-02-04 16:58:47,305 INFO Thread-8 :583863 [dir_watcher.py:_on_file_modified():230] file/dir modified: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/output.log
4347
+ 2022-02-04 16:58:49,307 INFO Thread-8 :583863 [dir_watcher.py:_on_file_modified():230] file/dir modified: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/output.log
4348
+ 2022-02-04 16:58:51,308 INFO Thread-8 :583863 [dir_watcher.py:_on_file_modified():230] file/dir modified: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/output.log
4349
+ 2022-02-04 16:58:53,309 INFO Thread-8 :583863 [dir_watcher.py:_on_file_modified():230] file/dir modified: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/output.log
4350
+ 2022-02-04 16:58:55,310 INFO Thread-8 :583863 [dir_watcher.py:_on_file_modified():230] file/dir modified: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/output.log
4351
+ 2022-02-04 16:59:00,175 DEBUG HandlerThread:583863 [handler.py:handle_request():130] handle_request: stop_status
4352
+ 2022-02-04 16:59:00,175 DEBUG SenderThread:583863 [sender.py:send_request():248] send_request: stop_status
4353
+ 2022-02-04 16:59:01,313 INFO Thread-8 :583863 [dir_watcher.py:_on_file_modified():230] file/dir modified: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/output.log
4354
+ 2022-02-04 16:59:04,716 WARNING MainThread:583863 [internal.py:wandb_internal():146] Internal process interrupt: 1
4355
+ 2022-02-04 16:59:05,315 INFO Thread-8 :583863 [dir_watcher.py:_on_file_modified():230] file/dir modified: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/output.log
4356
+ 2022-02-04 16:59:05,510 WARNING MainThread:583863 [internal.py:wandb_internal():146] Internal process interrupt: 2
4357
+ 2022-02-04 16:59:05,510 ERROR MainThread:583863 [internal.py:wandb_internal():149] Internal process interrupted.
4358
+ 2022-02-04 16:59:06,493 INFO SenderThread:583863 [sender.py:finish():1070] shutting down sender
4359
+ 2022-02-04 16:59:06,493 INFO WriterThread:583863 [datastore.py:close():281] close: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/run-2dc06ifr.wandb
4360
+ 2022-02-04 16:59:06,494 INFO SenderThread:583863 [dir_watcher.py:finish():283] shutting down directory watcher
4361
+ 2022-02-04 16:59:07,317 INFO SenderThread:583863 [dir_watcher.py:finish():313] scan: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files
4362
+ 2022-02-04 16:59:07,318 INFO SenderThread:583863 [dir_watcher.py:finish():327] scan save: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/wandb-metadata.json wandb-metadata.json
4363
+ 2022-02-04 16:59:07,318 INFO SenderThread:583863 [dir_watcher.py:finish():327] scan save: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/output.log output.log
4364
+ 2022-02-04 16:59:07,318 INFO SenderThread:583863 [dir_watcher.py:finish():327] scan save: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/requirements.txt requirements.txt
4365
+ 2022-02-04 16:59:07,348 INFO SenderThread:583863 [dir_watcher.py:finish():327] scan save: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/wandb-summary.json wandb-summary.json
4366
+ 2022-02-04 16:59:07,354 INFO SenderThread:583863 [dir_watcher.py:finish():327] scan save: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/config.yaml config.yaml
4367
+ 2022-02-04 16:59:07,356 INFO SenderThread:583863 [dir_watcher.py:finish():327] scan save: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/conda-environment.yaml conda-environment.yaml
4368
+ 2022-02-04 16:59:07,366 INFO SenderThread:583863 [file_pusher.py:finish():177] shutting down file pusher
4369
+ 2022-02-04 16:59:07,367 INFO SenderThread:583863 [file_pusher.py:join():182] waiting for file pusher
4370
+ 2022-02-04 16:59:07,895 INFO Thread-12 :583863 [upload_job.py:push():137] Uploaded file /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/output.log
4371
+ 2022-02-04 16:59:07,991 INFO Thread-13 :583863 [upload_job.py:push():137] Uploaded file /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/requirements.txt
4372
+ 2022-02-04 16:59:08,129 INFO Thread-14 :583863 [upload_job.py:push():137] Uploaded file /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/wandb-summary.json
4373
+ 2022-02-04 16:59:08,134 INFO Thread-15 :583863 [upload_job.py:push():137] Uploaded file /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/config.yaml
4374
+ 2022-02-04 16:59:08,848 INFO MainThread:583863 [internal.py:handle_exit():77] Internal process exited
wandb/run-20220204_152118-2dc06ifr/logs/debug.log CHANGED
@@ -24,3 +24,5 @@ config: {}
24
  2022-02-04 15:21:20,512 INFO MainThread:582896 [wandb_init.py:init():633] run started, returning control to user process
25
  2022-02-04 15:21:20,515 INFO MainThread:582896 [wandb_run.py:_config_callback():956] config_cb None None {'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': 'float32', 'use_bfloat16': False, 'pruned_heads': {}, 'tie_word_embeddings': True, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'chunk_size_feed_forward': 0, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'architectures': ['Wav2Vec2ForPreTraining'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': 1, 'pad_token_id': 48, 'eos_token_id': 2, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': None, 'problem_type': None, '_name_or_path': 'facebook/wav2vec2-xls-r-300m', 'transformers_version': '4.17.0.dev0', 'feat_extract_dropout': 0.0, 'model_type': 'wav2vec2', 'num_feat_extract_layers': 7, 'hidden_size': 1024, 'feat_extract_norm': 'layer', 'feat_extract_activation': 'gelu', 'conv_dim': [512, 512, 512, 512, 512, 512, 512], 'conv_stride': [5, 2, 2, 2, 2, 2, 2], 'conv_kernel': [10, 3, 3, 3, 3, 2, 2], 'conv_bias': True, 'num_conv_pos_embeddings': 128, 'num_conv_pos_embedding_groups': 16, 'num_hidden_layers': 24, 'intermediate_size': 4096, 'hidden_act': 'gelu', 'num_attention_heads': 16, 'hidden_dropout': 0.0, 'attention_dropout': 0.1, 'activation_dropout': 0.0, 'feat_proj_dropout': 0.1, 'final_dropout': 0.0, 'layerdrop': 0.0, 'layer_norm_eps': 1e-05, 'initializer_range': 0.02, 'vocab_size': 51, 'do_stable_layer_norm': True, 'use_weighted_layer_sum': False, 'apply_spec_augment': True, 'mask_time_prob': 0.4, 'mask_time_length': 10, 'mask_time_min_masks': 2, 'mask_feature_prob': 0.1, 'mask_feature_length': 10, 'mask_feature_min_masks': 0, 'num_codevectors_per_group': 320, 'num_codevector_groups': 2, 'contrastive_logits_temperature': 0.1, 'feat_quantizer_dropout': 0.0, 'num_negatives': 100, 'codevector_dim': 768, 'proj_codevector_dim': 768, 'diversity_loss_weight': 0.1, 'ctc_loss_reduction': 'mean', 'ctc_zero_infinity': False, 'add_adapter': False, 'adapter_kernel_size': 3, 'adapter_stride': 2, 'num_adapter_layers': 3, 'output_hidden_size': 1024, 'classifier_proj_size': 256, 'tdnn_dim': [512, 512, 512, 512, 1500], 'tdnn_kernel': [5, 3, 3, 1, 1], 'tdnn_dilation': [1, 2, 3, 1, 1], 'xvector_output_dim': 512, 'output_dir': './', 'overwrite_output_dir': True, 'do_train': True, 'do_eval': True, 'do_predict': False, 'evaluation_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 32, 'per_device_eval_batch_size': 8, 'per_gpu_train_batch_size': 'None', 'per_gpu_eval_batch_size': 'None', 'gradient_accumulation_steps': 2, 'eval_accumulation_steps': 'None', 'learning_rate': 5e-05, 'weight_decay': 0.0, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 40.0, 'max_steps': -1, 'lr_scheduler_type': 'linear', 'warmup_ratio': 0.0, 'warmup_steps': 1000, 'log_level': -1, 'log_level_replica': -1, 'log_on_each_node': True, 'logging_dir': './runs/Feb04_15-19-01_job-1c325595-1ca8-441f-8e94-43b2937c71d2', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 500, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 1000, 'save_total_limit': 2, 'save_on_each_node': False, 'no_cuda': False, 'seed': 42, 'bf16': False, 'fp16': True, 'fp16_opt_level': 'O1', 'half_precision_backend': 'amp', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': 'None', 'local_rank': -1, 'xpu_backend': 'None', 'tpu_num_cores': 'None', 'tpu_metrics_debug': False, 'debug': '[]', 'dataloader_drop_last': False, 'eval_steps': 400, 'dataloader_num_workers': 0, 'past_index': -1, 'run_name': './', 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': 'None', 'load_best_model_at_end': False, 'metric_for_best_model': 'None', 'greater_is_better': 'None', 'ignore_data_skip': False, 'sharded_ddp': '[]', 'deepspeed': 'None', 'label_smoothing_factor': 0.0, 'optim': 'adamw_hf', 'adafactor': False, 'group_by_length': True, 'length_column_name': 'input_length', 'report_to': "['wandb']", 'ddp_find_unused_parameters': 'None', 'ddp_bucket_cap_mb': 'None', 'dataloader_pin_memory': True, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': True, 'resume_from_checkpoint': 'None', 'hub_model_id': 'None', 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'gradient_checkpointing': True, 'fp16_backend': 'auto', 'push_to_hub_model_id': 'None', 'push_to_hub_organization': 'None', 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', '_n_gpu': 1, 'mp_parameters': '', 'train_batch_size': 32, 'eval_batch_size': 8}
26
  2022-02-04 15:21:20,519 INFO MainThread:582896 [wandb_watch.py:watch():43] Watching
 
 
 
24
  2022-02-04 15:21:20,512 INFO MainThread:582896 [wandb_init.py:init():633] run started, returning control to user process
25
  2022-02-04 15:21:20,515 INFO MainThread:582896 [wandb_run.py:_config_callback():956] config_cb None None {'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': 'float32', 'use_bfloat16': False, 'pruned_heads': {}, 'tie_word_embeddings': True, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'chunk_size_feed_forward': 0, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'architectures': ['Wav2Vec2ForPreTraining'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': 1, 'pad_token_id': 48, 'eos_token_id': 2, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': None, 'problem_type': None, '_name_or_path': 'facebook/wav2vec2-xls-r-300m', 'transformers_version': '4.17.0.dev0', 'feat_extract_dropout': 0.0, 'model_type': 'wav2vec2', 'num_feat_extract_layers': 7, 'hidden_size': 1024, 'feat_extract_norm': 'layer', 'feat_extract_activation': 'gelu', 'conv_dim': [512, 512, 512, 512, 512, 512, 512], 'conv_stride': [5, 2, 2, 2, 2, 2, 2], 'conv_kernel': [10, 3, 3, 3, 3, 2, 2], 'conv_bias': True, 'num_conv_pos_embeddings': 128, 'num_conv_pos_embedding_groups': 16, 'num_hidden_layers': 24, 'intermediate_size': 4096, 'hidden_act': 'gelu', 'num_attention_heads': 16, 'hidden_dropout': 0.0, 'attention_dropout': 0.1, 'activation_dropout': 0.0, 'feat_proj_dropout': 0.1, 'final_dropout': 0.0, 'layerdrop': 0.0, 'layer_norm_eps': 1e-05, 'initializer_range': 0.02, 'vocab_size': 51, 'do_stable_layer_norm': True, 'use_weighted_layer_sum': False, 'apply_spec_augment': True, 'mask_time_prob': 0.4, 'mask_time_length': 10, 'mask_time_min_masks': 2, 'mask_feature_prob': 0.1, 'mask_feature_length': 10, 'mask_feature_min_masks': 0, 'num_codevectors_per_group': 320, 'num_codevector_groups': 2, 'contrastive_logits_temperature': 0.1, 'feat_quantizer_dropout': 0.0, 'num_negatives': 100, 'codevector_dim': 768, 'proj_codevector_dim': 768, 'diversity_loss_weight': 0.1, 'ctc_loss_reduction': 'mean', 'ctc_zero_infinity': False, 'add_adapter': False, 'adapter_kernel_size': 3, 'adapter_stride': 2, 'num_adapter_layers': 3, 'output_hidden_size': 1024, 'classifier_proj_size': 256, 'tdnn_dim': [512, 512, 512, 512, 1500], 'tdnn_kernel': [5, 3, 3, 1, 1], 'tdnn_dilation': [1, 2, 3, 1, 1], 'xvector_output_dim': 512, 'output_dir': './', 'overwrite_output_dir': True, 'do_train': True, 'do_eval': True, 'do_predict': False, 'evaluation_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 32, 'per_device_eval_batch_size': 8, 'per_gpu_train_batch_size': 'None', 'per_gpu_eval_batch_size': 'None', 'gradient_accumulation_steps': 2, 'eval_accumulation_steps': 'None', 'learning_rate': 5e-05, 'weight_decay': 0.0, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 40.0, 'max_steps': -1, 'lr_scheduler_type': 'linear', 'warmup_ratio': 0.0, 'warmup_steps': 1000, 'log_level': -1, 'log_level_replica': -1, 'log_on_each_node': True, 'logging_dir': './runs/Feb04_15-19-01_job-1c325595-1ca8-441f-8e94-43b2937c71d2', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 500, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 1000, 'save_total_limit': 2, 'save_on_each_node': False, 'no_cuda': False, 'seed': 42, 'bf16': False, 'fp16': True, 'fp16_opt_level': 'O1', 'half_precision_backend': 'amp', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': 'None', 'local_rank': -1, 'xpu_backend': 'None', 'tpu_num_cores': 'None', 'tpu_metrics_debug': False, 'debug': '[]', 'dataloader_drop_last': False, 'eval_steps': 400, 'dataloader_num_workers': 0, 'past_index': -1, 'run_name': './', 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': 'None', 'load_best_model_at_end': False, 'metric_for_best_model': 'None', 'greater_is_better': 'None', 'ignore_data_skip': False, 'sharded_ddp': '[]', 'deepspeed': 'None', 'label_smoothing_factor': 0.0, 'optim': 'adamw_hf', 'adafactor': False, 'group_by_length': True, 'length_column_name': 'input_length', 'report_to': "['wandb']", 'ddp_find_unused_parameters': 'None', 'ddp_bucket_cap_mb': 'None', 'dataloader_pin_memory': True, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': True, 'resume_from_checkpoint': 'None', 'hub_model_id': 'None', 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'gradient_checkpointing': True, 'fp16_backend': 'auto', 'push_to_hub_model_id': 'None', 'push_to_hub_organization': 'None', 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', '_n_gpu': 1, 'mp_parameters': '', 'train_batch_size': 32, 'eval_batch_size': 8}
26
  2022-02-04 15:21:20,519 INFO MainThread:582896 [wandb_watch.py:watch():43] Watching
27
+ 2022-02-04 16:59:04,749 INFO MainThread:582896 [wandb_run.py:_atexit_cleanup():1780] got exitcode: 255
28
+ 2022-02-04 16:59:04,751 INFO MainThread:582896 [wandb_run.py:_restore():1752] restore
wandb/run-20220204_152118-2dc06ifr/run-2dc06ifr.wandb CHANGED
Binary files a/wandb/run-20220204_152118-2dc06ifr/run-2dc06ifr.wandb and b/wandb/run-20220204_152118-2dc06ifr/run-2dc06ifr.wandb differ
 
wandb/run-20220204_170031-gzsqxey3/files/conda-environment.yaml ADDED
File without changes
wandb/run-20220204_170031-gzsqxey3/files/config.yaml ADDED
The diff for this file is too large to render. See raw diff
 
wandb/run-20220204_170031-gzsqxey3/files/output.log ADDED
@@ -0,0 +1,533 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+
3
+
4
+
5
+
6
+
7
+
8
+
9
+
10
+
11
+
12
+
13
+
14
+
15
+
16
+
17
+
18
+
19
+
20
+
21
+
22
+
23
+
24
+
25
+
26
+
27
+
28
+
29
+
30
+
31
+
32
+
33
+
34
+
35
+
36
+
37
+
38
+
39
+
40
+
41
+
42
+
43
+
44
+
45
+
46
+
47
+
48
+
49
+
50
+
51
+
52
+
53
+
54
+
55
+
56
+
57
+
58
+
59
+
60
+
61
+
62
+
63
+
64
+
65
+
66
+
67
+
68
+
69
+
70
+
71
+
72
+
73
+
74
+
75
+
76
+
77
+
78
+
79
+
80
+
81
+
82
+
83
+
84
+
85
+
86
+
87
+
88
+
89
+
90
+
91
+
92
+
93
+
94
+
95
+
96
+
97
+
98
+
99
+
100
+
101
+
102
+
103
+
104
+
105
+
106
+
107
+
108
+
109
+
110
+
111
+
112
+
113
+
114
+
115
+
116
+
117
+
118
+
119
+
120
+
121
+
122
+
123
+
124
+
125
+
126
+
127
+
128
+
129
+
130
+
131
+
132
+
133
+
134
+
135
+
136
+
137
+
138
+
139
+
140
+
141
+
142
+
143
+
144
+
145
+
146
+
147
+
148
+
149
+
150
+
151
+
152
+
153
+
154
+
155
+
156
+
157
+
158
+
159
+
160
+
161
+
162
+
163
+
164
+
165
+
166
+
167
+
168
+
169
+
170
+
171
+
172
+
173
+
174
+
175
+
176
+
177
+
178
+
179
+
180
+
181
+
182
+
183
+
184
+
185
+
186
+
187
+
188
+
189
+
190
+
191
+
192
+
193
+
194
+
195
+
196
+
197
+
198
+
199
+
200
+
201
+
202
+
203
+
204
+
205
+
206
+
207
+
208
+
209
+
210
+
211
+
212
+
213
+
214
+
215
+
216
+
217
+
218
+
219
+
220
+
221
+
222
+
223
+
224
+
225
+
226
+
227
+
228
+
229
+
230
+
231
+
232
+
233
+
234
+
235
+
236
+
237
+
238
+
239
+
240
+
241
+
242
+
243
+
244
+
245
+
246
+
247
+
248
+
249
+
250
+
251
+
252
+
253
+
254
+
255
+
256
+
257
+
258
+
259
+
260
+
261
+
262
+
263
+
264
+
265
+
266
+
267
+
268
+
269
+
270
+
271
+
272
+
273
+
274
+
275
+
276
+
277
+
278
+
279
+
280
+
281
+
282
+
283
+
284
+
285
+
286
+
287
+
288
+
289
+
290
+
291
+
292
+
293
+
294
+
295
+
296
+
297
+
298
+
299
+
300
+
301
+
302
+
303
+
304
+
305
+
306
+
307
+
308
+
309
+
310
+
311
+
312
+
313
+
314
+
315
+
316
+
317
+
318
+
319
+
320
+
321
+
322
+
323
+
324
+
325
+
326
+
327
+
328
+
329
+
330
+
331
+
332
+
333
+
334
+
335
+
336
+
337
+
338
+
339
+
340
+
341
+
342
+
343
+
344
+
345
+
346
+
347
+
348
+
349
+
350
+
351
+
352
+
353
+
354
+
355
+
356
+
357
+
358
+
359
+
360
+
361
+
362
+
363
+
364
+
365
+
366
+
367
+
368
+
369
+
370
+
371
+
372
+
373
+
374
+
375
+
376
+
377
+
378
+
379
+
380
+
381
+
382
+
383
+
384
+
385
+
386
+
387
+
388
+
389
+
390
+
391
+
392
+
393
+
394
+
395
+
396
+
397
+
398
+
399
+
400
+
401
+
402
+
403
+
404
+
405
+
406
+
407
+
408
+
409
+
410
+
411
+
412
+
413
+
414
+
415
+
416
+
417
+
418
+
419
+
420
+
421
+
422
+
423
+
424
+
425
+
426
+
427
+
428
+
429
+
430
+
431
+
432
+
433
+
434
+
435
+
436
+
437
+
438
+
439
+
440
+
441
+
442
+
443
+
444
+
445
+
446
+
447
+
448
+
449
+
450
+
451
+
452
+
453
+
454
+
455
+
456
+
457
+
458
+
459
+
460
+
461
+
462
+
463
+
464
+
465
+
466
+
467
+
468
+
469
+
470
+
471
+
472
+
473
+
474
+
475
+
476
+
477
+
478
+
479
+
480
+
481
+
482
+
483
+
484
+
485
+
486
+
487
+
488
+
489
+
490
+
491
+
492
+
493
+
494
+
495
+ 11%|███████ | 499/4560 [23:43<3:19:11, 2.94s/it]
496
+ 11%|███████ | 500/4560 [23:47<3:44:34, 3.32s/it]The following columns in the evaluation set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.
497
+ ***** Running Evaluation *****
498
+ Num examples = 1681
499
+ Batch size = 8
500
+
501
+
502
+
503
+
504
+
505
+
506
+
507
+
508
+
509
+
510
+
511
+
512
+
513
+
514
+
515
+
516
+
517
+
518
+
519
+
520
+
521
+
522
+
523
+
524
+
525
+
526
+
527
+
528
+
529
+
530
+ Configuration saved in ./checkpoint-500/config.json
531
+ {'eval_loss': 3.128021001815796, 'eval_wer': 1.0, 'eval_runtime': 61.7966, 'eval_samples_per_second': 27.202, 'eval_steps_per_second': 3.414, 'epoch': 8.77}
532
+ Model weights saved in ./checkpoint-500/pytorch_model.bin
533
+ Configuration saved in ./checkpoint-500/preprocessor_config.json
wandb/run-20220204_170031-gzsqxey3/files/requirements.txt ADDED
@@ -0,0 +1,171 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ -atasets==1.17.1.dev0
2
+ -ransformers==4.16.0.dev0
3
+ aiohttp==3.8.1
4
+ aiosignal==1.2.0
5
+ analytics-python==1.4.0
6
+ appdirs==1.4.4
7
+ argon2-cffi==20.1.0
8
+ async-generator==1.10
9
+ async-timeout==4.0.2
10
+ attrs==21.1.0
11
+ audioread==2.1.9
12
+ backcall==0.2.0
13
+ backoff==1.10.0
14
+ bcrypt==3.2.0
15
+ beautifulsoup4==4.9.3
16
+ bleach==3.3.0
17
+ brotlipy==0.7.0
18
+ certifi==2020.12.5
19
+ cffi==1.14.3
20
+ chardet==3.0.4
21
+ charset-normalizer==2.0.10
22
+ click==8.0.3
23
+ conda-build==3.21.4
24
+ conda-package-handling==1.7.2
25
+ conda==4.9.2
26
+ configparser==5.2.0
27
+ cryptography==3.2.1
28
+ cycler==0.11.0
29
+ datasets==1.18.3
30
+ decorator==4.4.2
31
+ defusedxml==0.7.1
32
+ dill==0.3.4
33
+ dnspython==2.1.0
34
+ docker-pycreds==0.4.0
35
+ entrypoints==0.3
36
+ ffmpy==0.3.0
37
+ filelock==3.0.12
38
+ flask-cachebuster==1.0.0
39
+ flask-cors==3.0.10
40
+ flask-login==0.5.0
41
+ flask==2.0.2
42
+ fonttools==4.28.5
43
+ frozenlist==1.3.0
44
+ fsspec==2022.1.0
45
+ gitdb==4.0.9
46
+ gitpython==3.1.26
47
+ glob2==0.7
48
+ gradio==2.7.0
49
+ huggingface-hub==0.4.0
50
+ hypothesis==6.36.1
51
+ idna==2.10
52
+ ipykernel==5.5.4
53
+ ipython-genutils==0.2.0
54
+ ipython==7.21.0
55
+ ipywidgets==7.6.3
56
+ itsdangerous==2.0.1
57
+ jedi==0.17.0
58
+ jinja2==3.0.3
59
+ jiwer==2.3.0
60
+ joblib==1.1.0
61
+ json5==0.9.5
62
+ jsonschema==3.2.0
63
+ jupyter-client==6.1.12
64
+ jupyter-core==4.7.1
65
+ jupyterlab-pygments==0.1.2
66
+ jupyterlab-server==1.2.0
67
+ jupyterlab-widgets==1.0.0
68
+ jupyterlab==2.2.9
69
+ kenlm==0.0.0
70
+ kiwisolver==1.3.2
71
+ libarchive-c==2.9
72
+ librosa==0.8.1
73
+ llvmlite==0.38.0
74
+ markdown2==2.4.2
75
+ markupsafe==2.0.1
76
+ matplotlib==3.5.1
77
+ mistune==0.8.4
78
+ mkl-fft==1.3.0
79
+ mkl-random==1.1.1
80
+ mkl-service==2.3.0
81
+ monotonic==1.6
82
+ multidict==5.2.0
83
+ multiprocess==0.70.12.2
84
+ nano==0.10.0
85
+ nbclient==0.5.3
86
+ nbconvert==6.0.7
87
+ nbformat==5.1.3
88
+ nest-asyncio==1.5.1
89
+ notebook==6.3.0
90
+ numba==0.55.0
91
+ numpy==1.19.2
92
+ olefile==0.46
93
+ packaging==20.9
94
+ pandas==1.3.5
95
+ pandocfilters==1.4.3
96
+ paramiko==2.9.2
97
+ parso==0.8.1
98
+ pathtools==0.1.2
99
+ pexpect==4.8.0
100
+ pickleshare==0.7.5
101
+ pillow==8.1.2
102
+ pip==21.3.1
103
+ pkginfo==1.7.0
104
+ pooch==1.5.2
105
+ prometheus-client==0.10.1
106
+ promise==2.3
107
+ prompt-toolkit==3.0.8
108
+ protobuf==3.19.3
109
+ psutil==5.8.0
110
+ ptyprocess==0.7.0
111
+ pyarrow==6.0.1
112
+ pycosat==0.6.3
113
+ pycparser==2.20
114
+ pycryptodome==3.12.0
115
+ pyctcdecode==0.3.0
116
+ pydub==0.25.1
117
+ pygments==2.8.0
118
+ pygtrie==2.4.2
119
+ pynacl==1.5.0
120
+ pyopenssl==19.1.0
121
+ pyparsing==2.4.7
122
+ pyrsistent==0.17.3
123
+ pysocks==1.7.1
124
+ python-dateutil==2.8.1
125
+ python-etcd==0.4.5
126
+ python-levenshtein==0.12.2
127
+ pytz==2021.1
128
+ pyyaml==5.4.1
129
+ pyzmq==22.0.3
130
+ regex==2022.1.18
131
+ requests==2.24.0
132
+ resampy==0.2.2
133
+ ruamel-yaml==0.15.87
134
+ sacremoses==0.0.47
135
+ scikit-learn==1.0.2
136
+ scipy==1.7.3
137
+ send2trash==1.5.0
138
+ sentry-sdk==1.5.4
139
+ setuptools==50.3.1.post20201107
140
+ shortuuid==1.0.8
141
+ six==1.15.0
142
+ smmap==5.0.0
143
+ sortedcontainers==2.4.0
144
+ soundfile==0.10.3.post1
145
+ soupsieve==2.2
146
+ subprocess32==3.5.4
147
+ termcolor==1.1.0
148
+ terminado==0.9.4
149
+ testpath==0.4.4
150
+ threadpoolctl==3.0.0
151
+ tokenizers==0.11.4
152
+ torch==1.10.1
153
+ torchaudio==0.10.1
154
+ torchelastic==0.2.2
155
+ torchtext==0.9.1
156
+ torchvision==0.9.1
157
+ tornado==6.1
158
+ tqdm==4.62.3
159
+ traitlets==5.0.5
160
+ transformers==4.17.0.dev0
161
+ typing-extensions==3.7.4.3
162
+ urllib3==1.25.11
163
+ wandb==0.12.9
164
+ wcwidth==0.2.5
165
+ webencodings==0.5.1
166
+ werkzeug==2.0.2
167
+ wheel==0.35.1
168
+ widgetsnbextension==3.5.1
169
+ xxhash==2.0.2
170
+ yarl==1.7.2
171
+ yaspin==2.1.0
wandb/run-20220204_170031-gzsqxey3/files/wandb-metadata.json ADDED
@@ -0,0 +1,55 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-5.11.0-37-generic-x86_64-with-glibc2.10",
3
+ "python": "3.8.8",
4
+ "heartbeatAt": "2022-02-04T17:00:32.947275",
5
+ "startedAt": "2022-02-04T17:00:31.683578",
6
+ "docker": null,
7
+ "gpu": "Tesla V100S-PCIE-32GB",
8
+ "gpu_count": 1,
9
+ "cpu_count": 60,
10
+ "cuda": null,
11
+ "args": [
12
+ "--dataset_name=mozilla-foundation/common_voice_8_0",
13
+ "--model_name_or_path=facebook/wav2vec2-xls-r-300m",
14
+ "--dataset_config_name=el",
15
+ "--output_dir=./",
16
+ "--overwrite_output_dir",
17
+ "--num_train_epochs=80",
18
+ "--per_device_train_batch_size=32",
19
+ "--gradient_accumulation_steps=2",
20
+ "--learning_rate=5e-5",
21
+ "--warmup_steps=400",
22
+ "--lr_scheduler_type=linear",
23
+ "--feat_proj_dropout=0.1",
24
+ "--attention_dropout=0.1",
25
+ "--max_duration_in_seconds=15",
26
+ "--mask_time_prob=0.4",
27
+ "--mask_feature_prob=0.1",
28
+ "--evaluation_strategy=steps",
29
+ "--text_column_name=sentence",
30
+ "--length_column_name=input_length",
31
+ "--save_steps=500",
32
+ "--eval_steps=500",
33
+ "--layerdrop=0.0",
34
+ "--save_total_limit=2",
35
+ "--freeze_feature_encoder",
36
+ "--gradient_checkpointing",
37
+ "--fp16",
38
+ "--push_to_hub",
39
+ "--group_by_length",
40
+ "--do_train",
41
+ "--do_eval"
42
+ ],
43
+ "state": "running",
44
+ "program": "run_speech_recognition_ctc.py",
45
+ "codePath": "run_speech_recognition_ctc.py",
46
+ "git": {
47
+ "remote": "https://huggingface.co/ayameRushia/wav2vec2-large-xls-r-300m-el",
48
+ "commit": "dc39b02954010cda629c3aadbcb5e0ab724f8d16"
49
+ },
50
+ "email": "magunghambali@gmail.com",
51
+ "root": "/workspace/wav2vec2-large-xls-r-300m-el",
52
+ "host": "job-1c325595-1ca8-441f-8e94-43b2937c71d2",
53
+ "username": "ovh",
54
+ "executable": "/opt/conda/bin/python"
55
+ }
wandb/run-20220204_170031-gzsqxey3/files/wandb-summary.json ADDED
The diff for this file is too large to render. See raw diff
 
wandb/run-20220204_170031-gzsqxey3/logs/debug-internal.log ADDED
The diff for this file is too large to render. See raw diff
 
wandb/run-20220204_170031-gzsqxey3/logs/debug.log ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2022-02-04 17:00:31,686 INFO MainThread:622234 [wandb_setup.py:_flush():71] Unhandled environment var: WANDB_RUN
2
+ 2022-02-04 17:00:31,686 INFO MainThread:622234 [wandb_setup.py:_flush():71] setting env: {'project': 'wav2vec2-mn-1', 'run_name': 'run dataset 1.18.3'}
3
+ 2022-02-04 17:00:31,687 INFO MainThread:622234 [wandb_setup.py:_flush():71] setting login settings: {}
4
+ 2022-02-04 17:00:31,687 INFO MainThread:622234 [wandb_init.py:_log_setup():371] Logging user logs to /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_170031-gzsqxey3/logs/debug.log
5
+ 2022-02-04 17:00:31,687 INFO MainThread:622234 [wandb_init.py:_log_setup():372] Logging internal logs to /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_170031-gzsqxey3/logs/debug-internal.log
6
+ 2022-02-04 17:00:31,687 INFO MainThread:622234 [wandb_init.py:init():404] calling init triggers
7
+ 2022-02-04 17:00:31,687 INFO MainThread:622234 [wandb_init.py:init():409] wandb.init called with sweep_config: {}
8
+ config: {}
9
+ 2022-02-04 17:00:31,687 INFO MainThread:622234 [wandb_init.py:init():460] starting backend
10
+ 2022-02-04 17:00:31,687 INFO MainThread:622234 [backend.py:_multiprocessing_setup():99] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
11
+ 2022-02-04 17:00:31,762 INFO MainThread:622234 [backend.py:ensure_launched():216] starting backend process...
12
+ 2022-02-04 17:00:31,853 INFO MainThread:622234 [backend.py:ensure_launched():221] started backend process with pid: 622748
13
+ 2022-02-04 17:00:31,856 INFO MainThread:622234 [wandb_init.py:init():469] backend started and connected
14
+ 2022-02-04 17:00:31,866 INFO MainThread:622234 [wandb_init.py:init():533] updated telemetry
15
+ 2022-02-04 17:00:32,016 INFO MainThread:622234 [wandb_init.py:init():563] communicating current version
16
+ 2022-02-04 17:00:32,744 INFO MainThread:622234 [wandb_init.py:init():568] got version response upgrade_message: "wandb version 0.12.10 is available! To upgrade, please run:\n $ pip install wandb --upgrade"
17
+
18
+ 2022-02-04 17:00:32,744 INFO MainThread:622234 [wandb_init.py:init():578] communicating run to backend with 30 second timeout
19
+ 2022-02-04 17:00:32,936 INFO MainThread:622234 [wandb_init.py:init():606] starting run threads in backend
20
+ 2022-02-04 17:00:33,569 INFO MainThread:622234 [wandb_run.py:_console_start():1810] atexit reg
21
+ 2022-02-04 17:00:33,570 INFO MainThread:622234 [wandb_run.py:_redirect():1684] redirect: SettingsConsole.REDIRECT
22
+ 2022-02-04 17:00:33,571 INFO MainThread:622234 [wandb_run.py:_redirect():1689] Redirecting console.
23
+ 2022-02-04 17:00:33,575 INFO MainThread:622234 [wandb_run.py:_redirect():1745] Redirects installed.
24
+ 2022-02-04 17:00:33,575 INFO MainThread:622234 [wandb_init.py:init():633] run started, returning control to user process
25
+ 2022-02-04 17:00:33,579 INFO MainThread:622234 [wandb_run.py:_config_callback():956] config_cb None None {'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': 'float32', 'use_bfloat16': False, 'pruned_heads': {}, 'tie_word_embeddings': True, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'chunk_size_feed_forward': 0, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'architectures': ['Wav2Vec2ForPreTraining'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': 1, 'pad_token_id': 48, 'eos_token_id': 2, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': None, 'problem_type': None, '_name_or_path': 'facebook/wav2vec2-xls-r-300m', 'transformers_version': '4.17.0.dev0', 'feat_extract_dropout': 0.0, 'model_type': 'wav2vec2', 'num_feat_extract_layers': 7, 'hidden_size': 1024, 'feat_extract_norm': 'layer', 'feat_extract_activation': 'gelu', 'conv_dim': [512, 512, 512, 512, 512, 512, 512], 'conv_stride': [5, 2, 2, 2, 2, 2, 2], 'conv_kernel': [10, 3, 3, 3, 3, 2, 2], 'conv_bias': True, 'num_conv_pos_embeddings': 128, 'num_conv_pos_embedding_groups': 16, 'num_hidden_layers': 24, 'intermediate_size': 4096, 'hidden_act': 'gelu', 'num_attention_heads': 16, 'hidden_dropout': 0.0, 'attention_dropout': 0.1, 'activation_dropout': 0.0, 'feat_proj_dropout': 0.1, 'final_dropout': 0.0, 'layerdrop': 0.0, 'layer_norm_eps': 1e-05, 'initializer_range': 0.02, 'vocab_size': 51, 'do_stable_layer_norm': True, 'use_weighted_layer_sum': False, 'apply_spec_augment': True, 'mask_time_prob': 0.4, 'mask_time_length': 10, 'mask_time_min_masks': 2, 'mask_feature_prob': 0.1, 'mask_feature_length': 10, 'mask_feature_min_masks': 0, 'num_codevectors_per_group': 320, 'num_codevector_groups': 2, 'contrastive_logits_temperature': 0.1, 'feat_quantizer_dropout': 0.0, 'num_negatives': 100, 'codevector_dim': 768, 'proj_codevector_dim': 768, 'diversity_loss_weight': 0.1, 'ctc_loss_reduction': 'mean', 'ctc_zero_infinity': False, 'add_adapter': False, 'adapter_kernel_size': 3, 'adapter_stride': 2, 'num_adapter_layers': 3, 'output_hidden_size': 1024, 'classifier_proj_size': 256, 'tdnn_dim': [512, 512, 512, 512, 1500], 'tdnn_kernel': [5, 3, 3, 1, 1], 'tdnn_dilation': [1, 2, 3, 1, 1], 'xvector_output_dim': 512, 'output_dir': './', 'overwrite_output_dir': True, 'do_train': True, 'do_eval': True, 'do_predict': False, 'evaluation_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 32, 'per_device_eval_batch_size': 8, 'per_gpu_train_batch_size': 'None', 'per_gpu_eval_batch_size': 'None', 'gradient_accumulation_steps': 2, 'eval_accumulation_steps': 'None', 'learning_rate': 5e-05, 'weight_decay': 0.0, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 80.0, 'max_steps': -1, 'lr_scheduler_type': 'linear', 'warmup_ratio': 0.0, 'warmup_steps': 400, 'log_level': -1, 'log_level_replica': -1, 'log_on_each_node': True, 'logging_dir': './runs/Feb04_16-59-26_job-1c325595-1ca8-441f-8e94-43b2937c71d2', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 500, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 500, 'save_total_limit': 2, 'save_on_each_node': False, 'no_cuda': False, 'seed': 42, 'bf16': False, 'fp16': True, 'fp16_opt_level': 'O1', 'half_precision_backend': 'amp', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': 'None', 'local_rank': -1, 'xpu_backend': 'None', 'tpu_num_cores': 'None', 'tpu_metrics_debug': False, 'debug': '[]', 'dataloader_drop_last': False, 'eval_steps': 500, 'dataloader_num_workers': 0, 'past_index': -1, 'run_name': './', 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': 'None', 'load_best_model_at_end': False, 'metric_for_best_model': 'None', 'greater_is_better': 'None', 'ignore_data_skip': False, 'sharded_ddp': '[]', 'deepspeed': 'None', 'label_smoothing_factor': 0.0, 'optim': 'adamw_hf', 'adafactor': False, 'group_by_length': True, 'length_column_name': 'input_length', 'report_to': "['wandb']", 'ddp_find_unused_parameters': 'None', 'ddp_bucket_cap_mb': 'None', 'dataloader_pin_memory': True, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': True, 'resume_from_checkpoint': 'None', 'hub_model_id': 'None', 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'gradient_checkpointing': True, 'fp16_backend': 'auto', 'push_to_hub_model_id': 'None', 'push_to_hub_organization': 'None', 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', '_n_gpu': 1, 'mp_parameters': '', 'train_batch_size': 32, 'eval_batch_size': 8}
26
+ 2022-02-04 17:00:33,583 INFO MainThread:622234 [wandb_watch.py:watch():43] Watching
wandb/run-20220204_170031-gzsqxey3/run-gzsqxey3.wandb ADDED
Binary file (803 kB). View file