ayameRushia committed on Feb 4, 2022

Commit

8543a98

•

1 Parent(s): dc39b02

Training in progress, step 500

Browse files

Files changed (21) hide show

.ipynb_checkpoints/run-checkpoint.sh +4 -4
pytorch_model.bin +1 -1
run.sh +3 -3
special_tokens_map.json +1 -1
training_args.bin +1 -1
wandb/debug-internal.log +1 -1
wandb/debug.log +1 -1
wandb/latest-run +1 -1
wandb/run-20220204_152118-2dc06ifr/files/output.log +10 -0
wandb/run-20220204_152118-2dc06ifr/logs/debug-internal.log +35 -0
wandb/run-20220204_152118-2dc06ifr/logs/debug.log +2 -0
wandb/run-20220204_152118-2dc06ifr/run-2dc06ifr.wandb +0 -0
wandb/run-20220204_170031-gzsqxey3/files/conda-environment.yaml +0 -0
wandb/run-20220204_170031-gzsqxey3/files/config.yaml +0 -0
wandb/run-20220204_170031-gzsqxey3/files/output.log +533 -0
wandb/run-20220204_170031-gzsqxey3/files/requirements.txt +171 -0
wandb/run-20220204_170031-gzsqxey3/files/wandb-metadata.json +55 -0
wandb/run-20220204_170031-gzsqxey3/files/wandb-summary.json +0 -0
wandb/run-20220204_170031-gzsqxey3/logs/debug-internal.log +0 -0
wandb/run-20220204_170031-gzsqxey3/logs/debug.log +26 -0
wandb/run-20220204_170031-gzsqxey3/run-gzsqxey3.wandb +0 -0

.ipynb_checkpoints/run-checkpoint.sh CHANGED Viewed

@@ -4,11 +4,11 @@ python run_speech_recognition_ctc.py \
 	--dataset_config_name="el" \
 	--output_dir="./" \
 	--overwrite_output_dir \
-	--num_train_epochs="40" \
 	--per_device_train_batch_size="32" \
 	--gradient_accumulation_steps="2" \
 	--learning_rate="5e-5" \
-	--warmup_steps="1000" \
     --lr_scheduler_type="linear" \
     --feat_proj_dropout="0.1" \
     --attention_dropout="0.1" \
@@ -18,8 +18,8 @@ python run_speech_recognition_ctc.py \
 	--evaluation_strategy="steps" \
 	--text_column_name="sentence" \
 	--length_column_name="input_length" \
-	--save_steps="1000" \
-	--eval_steps="400" \
 	--layerdrop="0.0" \
 	--save_total_limit="2" \
 	--freeze_feature_encoder \

 	--dataset_config_name="el" \
 	--output_dir="./" \
 	--overwrite_output_dir \
+	--num_train_epochs="80" \
 	--per_device_train_batch_size="32" \
 	--gradient_accumulation_steps="2" \
 	--learning_rate="5e-5" \
+	--warmup_steps="400" \
     --lr_scheduler_type="linear" \
     --feat_proj_dropout="0.1" \
     --attention_dropout="0.1" \
 	--evaluation_strategy="steps" \
 	--text_column_name="sentence" \
 	--length_column_name="input_length" \
+	--save_steps="500" \
+	--eval_steps="500" \
 	--layerdrop="0.0" \
 	--save_total_limit="2" \
 	--freeze_feature_encoder \

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0f5416c25274021c86ac8b1598fd021bfae47e384c96367caf69013bad81241f
 size 1262132785

 version https://git-lfs.github.com/spec/v1
+oid sha256:fbcdd6e77557731974267ab6f87f16eb50dc8e354267250c951df02997cc6db0
 size 1262132785

run.sh CHANGED Viewed

@@ -4,7 +4,7 @@ python run_speech_recognition_ctc.py \
 	--dataset_config_name="el" \
 	--output_dir="./" \
 	--overwrite_output_dir \
-	--num_train_epochs="40" \
 	--per_device_train_batch_size="32" \
 	--gradient_accumulation_steps="2" \
 	--learning_rate="5e-5" \
@@ -18,8 +18,8 @@ python run_speech_recognition_ctc.py \
 	--evaluation_strategy="steps" \
 	--text_column_name="sentence" \
 	--length_column_name="input_length" \
-	--save_steps="1000" \
-	--eval_steps="400" \
 	--layerdrop="0.0" \
 	--save_total_limit="2" \
 	--freeze_feature_encoder \

 	--dataset_config_name="el" \
 	--output_dir="./" \
 	--overwrite_output_dir \
+	--num_train_epochs="80" \
 	--per_device_train_batch_size="32" \
 	--gradient_accumulation_steps="2" \
 	--learning_rate="5e-5" \
 	--evaluation_strategy="steps" \
 	--text_column_name="sentence" \
 	--length_column_name="input_length" \
+	--save_steps="500" \
+	--eval_steps="500" \
 	--layerdrop="0.0" \
 	--save_total_limit="2" \
 	--freeze_feature_encoder \

special_tokens_map.json CHANGED Viewed

	@@ -1 +1 @@
1	- {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]", "additional_special_tokens": [{"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}]}

+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]", "additional_special_tokens": [{"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}]}

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:319739be0b8c57a290a35449f4033858ca110fe3f2f3563987386ce1d776afec
 size 2991

 version https://git-lfs.github.com/spec/v1
+oid sha256:2cdb010419a9871a35ab482d0abfa3068a8f870c9ba360d2ea0173560ab60642
 size 2991

wandb/debug-internal.log CHANGED Viewed

	@@ -1 +1 @@
1	- run-20220204_152118-2dc06ifr/logs/debug-internal.log


1	+ run-20220204_170031-gzsqxey3/logs/debug-internal.log

wandb/debug.log CHANGED Viewed

	@@ -1 +1 @@
1	- run-20220204_152118-2dc06ifr/logs/debug.log


1	+ run-20220204_170031-gzsqxey3/logs/debug.log

wandb/latest-run CHANGED Viewed

	@@ -1 +1 @@
1	- run-20220204_152118-2dc06ifr


1	+ run-20220204_170031-gzsqxey3

wandb/run-20220204_152118-2dc06ifr/files/output.log CHANGED Viewed

@@ -2129,3 +2129,13 @@ Configuration saved in ./preprocessor_config.json
 Configuration saved in ./checkpoint-2000/config.json
 Model weights saved in ./checkpoint-2000/pytorch_model.bin
 Configuration saved in ./checkpoint-2000/preprocessor_config.json

 Configuration saved in ./checkpoint-2000/config.json
 Model weights saved in ./checkpoint-2000/pytorch_model.bin
 Configuration saved in ./checkpoint-2000/preprocessor_config.json
+Configuration saved in ./preprocessor_config.json

wandb/run-20220204_152118-2dc06ifr/logs/debug-internal.log CHANGED Viewed

@@ -4337,3 +4337,38 @@
 2022-02-04 16:58:14,679 DEBUG   SenderThread:583863 [sender.py:send_request():248] send_request: stop_status
 2022-02-04 16:58:29,844 DEBUG   HandlerThread:583863 [handler.py:handle_request():130] handle_request: stop_status
 2022-02-04 16:58:29,845 DEBUG   SenderThread:583863 [sender.py:send_request():248] send_request: stop_status

 2022-02-04 16:58:14,679 DEBUG   SenderThread:583863 [sender.py:send_request():248] send_request: stop_status
 2022-02-04 16:58:29,844 DEBUG   HandlerThread:583863 [handler.py:handle_request():130] handle_request: stop_status
 2022-02-04 16:58:29,845 DEBUG   SenderThread:583863 [sender.py:send_request():248] send_request: stop_status
+2022-02-04 16:58:38,298 INFO    Thread-8  :583863 [dir_watcher.py:_on_file_modified():230] file/dir modified: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/output.log
+2022-02-04 16:58:39,288 DEBUG   SenderThread:583863 [sender.py:send():234] send: stats
+2022-02-04 16:58:41,300 INFO    Thread-8  :583863 [dir_watcher.py:_on_file_modified():230] file/dir modified: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/output.log
+2022-02-04 16:58:43,303 INFO    Thread-8  :583863 [dir_watcher.py:_on_file_modified():230] file/dir modified: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/output.log
+2022-02-04 16:58:45,015 DEBUG   HandlerThread:583863 [handler.py:handle_request():130] handle_request: stop_status
+2022-02-04 16:58:45,015 DEBUG   SenderThread:583863 [sender.py:send_request():248] send_request: stop_status
+2022-02-04 16:58:47,305 INFO    Thread-8  :583863 [dir_watcher.py:_on_file_modified():230] file/dir modified: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/output.log
+2022-02-04 16:58:49,307 INFO    Thread-8  :583863 [dir_watcher.py:_on_file_modified():230] file/dir modified: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/output.log
+2022-02-04 16:58:51,308 INFO    Thread-8  :583863 [dir_watcher.py:_on_file_modified():230] file/dir modified: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/output.log
+2022-02-04 16:58:53,309 INFO    Thread-8  :583863 [dir_watcher.py:_on_file_modified():230] file/dir modified: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/output.log
+2022-02-04 16:58:55,310 INFO    Thread-8  :583863 [dir_watcher.py:_on_file_modified():230] file/dir modified: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/output.log
+2022-02-04 16:59:00,175 DEBUG   HandlerThread:583863 [handler.py:handle_request():130] handle_request: stop_status
+2022-02-04 16:59:00,175 DEBUG   SenderThread:583863 [sender.py:send_request():248] send_request: stop_status
+2022-02-04 16:59:01,313 INFO    Thread-8  :583863 [dir_watcher.py:_on_file_modified():230] file/dir modified: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/output.log
+2022-02-04 16:59:04,716 WARNING MainThread:583863 [internal.py:wandb_internal():146] Internal process interrupt: 1
+2022-02-04 16:59:05,315 INFO    Thread-8  :583863 [dir_watcher.py:_on_file_modified():230] file/dir modified: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/output.log
+2022-02-04 16:59:05,510 WARNING MainThread:583863 [internal.py:wandb_internal():146] Internal process interrupt: 2
+2022-02-04 16:59:05,510 ERROR   MainThread:583863 [internal.py:wandb_internal():149] Internal process interrupted.
+2022-02-04 16:59:06,493 INFO    SenderThread:583863 [sender.py:finish():1070] shutting down sender
+2022-02-04 16:59:06,493 INFO    WriterThread:583863 [datastore.py:close():281] close: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/run-2dc06ifr.wandb
+2022-02-04 16:59:06,494 INFO    SenderThread:583863 [dir_watcher.py:finish():283] shutting down directory watcher
+2022-02-04 16:59:07,317 INFO    SenderThread:583863 [dir_watcher.py:finish():313] scan: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files
+2022-02-04 16:59:07,318 INFO    SenderThread:583863 [dir_watcher.py:finish():327] scan save: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/wandb-metadata.json wandb-metadata.json
+2022-02-04 16:59:07,318 INFO    SenderThread:583863 [dir_watcher.py:finish():327] scan save: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/output.log output.log
+2022-02-04 16:59:07,318 INFO    SenderThread:583863 [dir_watcher.py:finish():327] scan save: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/requirements.txt requirements.txt
+2022-02-04 16:59:07,348 INFO    SenderThread:583863 [dir_watcher.py:finish():327] scan save: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/wandb-summary.json wandb-summary.json
+2022-02-04 16:59:07,354 INFO    SenderThread:583863 [dir_watcher.py:finish():327] scan save: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/config.yaml config.yaml
+2022-02-04 16:59:07,356 INFO    SenderThread:583863 [dir_watcher.py:finish():327] scan save: /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/conda-environment.yaml conda-environment.yaml
+2022-02-04 16:59:07,366 INFO    SenderThread:583863 [file_pusher.py:finish():177] shutting down file pusher
+2022-02-04 16:59:07,367 INFO    SenderThread:583863 [file_pusher.py:join():182] waiting for file pusher
+2022-02-04 16:59:07,895 INFO    Thread-12 :583863 [upload_job.py:push():137] Uploaded file /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/output.log
+2022-02-04 16:59:07,991 INFO    Thread-13 :583863 [upload_job.py:push():137] Uploaded file /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/requirements.txt
+2022-02-04 16:59:08,129 INFO    Thread-14 :583863 [upload_job.py:push():137] Uploaded file /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/wandb-summary.json
+2022-02-04 16:59:08,134 INFO    Thread-15 :583863 [upload_job.py:push():137] Uploaded file /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_152118-2dc06ifr/files/config.yaml
+2022-02-04 16:59:08,848 INFO    MainThread:583863 [internal.py:handle_exit():77] Internal process exited

wandb/run-20220204_152118-2dc06ifr/logs/debug.log CHANGED Viewed

@@ -24,3 +24,5 @@ config: {}
 2022-02-04 15:21:20,512 INFO    MainThread:582896 [wandb_init.py:init():633] run started, returning control to user process
 2022-02-04 15:21:20,515 INFO    MainThread:582896 [wandb_run.py:_config_callback():956] config_cb None None {'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': 'float32', 'use_bfloat16': False, 'pruned_heads': {}, 'tie_word_embeddings': True, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'chunk_size_feed_forward': 0, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'architectures': ['Wav2Vec2ForPreTraining'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': 1, 'pad_token_id': 48, 'eos_token_id': 2, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': None, 'problem_type': None, '_name_or_path': 'facebook/wav2vec2-xls-r-300m', 'transformers_version': '4.17.0.dev0', 'feat_extract_dropout': 0.0, 'model_type': 'wav2vec2', 'num_feat_extract_layers': 7, 'hidden_size': 1024, 'feat_extract_norm': 'layer', 'feat_extract_activation': 'gelu', 'conv_dim': [512, 512, 512, 512, 512, 512, 512], 'conv_stride': [5, 2, 2, 2, 2, 2, 2], 'conv_kernel': [10, 3, 3, 3, 3, 2, 2], 'conv_bias': True, 'num_conv_pos_embeddings': 128, 'num_conv_pos_embedding_groups': 16, 'num_hidden_layers': 24, 'intermediate_size': 4096, 'hidden_act': 'gelu', 'num_attention_heads': 16, 'hidden_dropout': 0.0, 'attention_dropout': 0.1, 'activation_dropout': 0.0, 
'feat_proj_dropout': 0.1, 'final_dropout': 0.0, 'layerdrop': 0.0, 'layer_norm_eps': 1e-05, 'initializer_range': 0.02, 'vocab_size': 51, 'do_stable_layer_norm': True, 'use_weighted_layer_sum': False, 'apply_spec_augment': True, 'mask_time_prob': 0.4, 'mask_time_length': 10, 'mask_time_min_masks': 2, 'mask_feature_prob': 0.1, 'mask_feature_length': 10, 'mask_feature_min_masks': 0, 'num_codevectors_per_group': 320, 'num_codevector_groups': 2, 'contrastive_logits_temperature': 0.1, 'feat_quantizer_dropout': 0.0, 'num_negatives': 100, 'codevector_dim': 768, 'proj_codevector_dim': 768, 'diversity_loss_weight': 0.1, 'ctc_loss_reduction': 'mean', 'ctc_zero_infinity': False, 'add_adapter': False, 'adapter_kernel_size': 3, 'adapter_stride': 2, 'num_adapter_layers': 3, 'output_hidden_size': 1024, 'classifier_proj_size': 256, 'tdnn_dim': [512, 512, 512, 512, 1500], 'tdnn_kernel': [5, 3, 3, 1, 1], 'tdnn_dilation': [1, 2, 3, 1, 1], 'xvector_output_dim': 512, 'output_dir': './', 'overwrite_output_dir': True, 'do_train': True, 'do_eval': True, 'do_predict': False, 'evaluation_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 32, 'per_device_eval_batch_size': 8, 'per_gpu_train_batch_size': 'None', 'per_gpu_eval_batch_size': 'None', 'gradient_accumulation_steps': 2, 'eval_accumulation_steps': 'None', 'learning_rate': 5e-05, 'weight_decay': 0.0, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 40.0, 'max_steps': -1, 'lr_scheduler_type': 'linear', 'warmup_ratio': 0.0, 'warmup_steps': 1000, 'log_level': -1, 'log_level_replica': -1, 'log_on_each_node': True, 'logging_dir': './runs/Feb04_15-19-01_job-1c325595-1ca8-441f-8e94-43b2937c71d2', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 500, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 1000, 'save_total_limit': 2, 'save_on_each_node': False, 'no_cuda': False, 'seed': 42, 'bf16': False, 'fp16': True, 
'fp16_opt_level': 'O1', 'half_precision_backend': 'amp', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': 'None', 'local_rank': -1, 'xpu_backend': 'None', 'tpu_num_cores': 'None', 'tpu_metrics_debug': False, 'debug': '[]', 'dataloader_drop_last': False, 'eval_steps': 400, 'dataloader_num_workers': 0, 'past_index': -1, 'run_name': './', 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': 'None', 'load_best_model_at_end': False, 'metric_for_best_model': 'None', 'greater_is_better': 'None', 'ignore_data_skip': False, 'sharded_ddp': '[]', 'deepspeed': 'None', 'label_smoothing_factor': 0.0, 'optim': 'adamw_hf', 'adafactor': False, 'group_by_length': True, 'length_column_name': 'input_length', 'report_to': "['wandb']", 'ddp_find_unused_parameters': 'None', 'ddp_bucket_cap_mb': 'None', 'dataloader_pin_memory': True, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': True, 'resume_from_checkpoint': 'None', 'hub_model_id': 'None', 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'gradient_checkpointing': True, 'fp16_backend': 'auto', 'push_to_hub_model_id': 'None', 'push_to_hub_organization': 'None', 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', '_n_gpu': 1, 'mp_parameters': '', 'train_batch_size': 32, 'eval_batch_size': 8}
 2022-02-04 15:21:20,519 INFO    MainThread:582896 [wandb_watch.py:watch():43] Watching

 2022-02-04 15:21:20,512 INFO    MainThread:582896 [wandb_init.py:init():633] run started, returning control to user process
 2022-02-04 15:21:20,515 INFO    MainThread:582896 [wandb_run.py:_config_callback():956] config_cb None None {'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': 'float32', 'use_bfloat16': False, 'pruned_heads': {}, 'tie_word_embeddings': True, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'chunk_size_feed_forward': 0, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'architectures': ['Wav2Vec2ForPreTraining'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': 1, 'pad_token_id': 48, 'eos_token_id': 2, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': None, 'problem_type': None, '_name_or_path': 'facebook/wav2vec2-xls-r-300m', 'transformers_version': '4.17.0.dev0', 'feat_extract_dropout': 0.0, 'model_type': 'wav2vec2', 'num_feat_extract_layers': 7, 'hidden_size': 1024, 'feat_extract_norm': 'layer', 'feat_extract_activation': 'gelu', 'conv_dim': [512, 512, 512, 512, 512, 512, 512], 'conv_stride': [5, 2, 2, 2, 2, 2, 2], 'conv_kernel': [10, 3, 3, 3, 3, 2, 2], 'conv_bias': True, 'num_conv_pos_embeddings': 128, 'num_conv_pos_embedding_groups': 16, 'num_hidden_layers': 24, 'intermediate_size': 4096, 'hidden_act': 'gelu', 'num_attention_heads': 16, 'hidden_dropout': 0.0, 'attention_dropout': 0.1, 'activation_dropout': 0.0, 
'feat_proj_dropout': 0.1, 'final_dropout': 0.0, 'layerdrop': 0.0, 'layer_norm_eps': 1e-05, 'initializer_range': 0.02, 'vocab_size': 51, 'do_stable_layer_norm': True, 'use_weighted_layer_sum': False, 'apply_spec_augment': True, 'mask_time_prob': 0.4, 'mask_time_length': 10, 'mask_time_min_masks': 2, 'mask_feature_prob': 0.1, 'mask_feature_length': 10, 'mask_feature_min_masks': 0, 'num_codevectors_per_group': 320, 'num_codevector_groups': 2, 'contrastive_logits_temperature': 0.1, 'feat_quantizer_dropout': 0.0, 'num_negatives': 100, 'codevector_dim': 768, 'proj_codevector_dim': 768, 'diversity_loss_weight': 0.1, 'ctc_loss_reduction': 'mean', 'ctc_zero_infinity': False, 'add_adapter': False, 'adapter_kernel_size': 3, 'adapter_stride': 2, 'num_adapter_layers': 3, 'output_hidden_size': 1024, 'classifier_proj_size': 256, 'tdnn_dim': [512, 512, 512, 512, 1500], 'tdnn_kernel': [5, 3, 3, 1, 1], 'tdnn_dilation': [1, 2, 3, 1, 1], 'xvector_output_dim': 512, 'output_dir': './', 'overwrite_output_dir': True, 'do_train': True, 'do_eval': True, 'do_predict': False, 'evaluation_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 32, 'per_device_eval_batch_size': 8, 'per_gpu_train_batch_size': 'None', 'per_gpu_eval_batch_size': 'None', 'gradient_accumulation_steps': 2, 'eval_accumulation_steps': 'None', 'learning_rate': 5e-05, 'weight_decay': 0.0, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 40.0, 'max_steps': -1, 'lr_scheduler_type': 'linear', 'warmup_ratio': 0.0, 'warmup_steps': 1000, 'log_level': -1, 'log_level_replica': -1, 'log_on_each_node': True, 'logging_dir': './runs/Feb04_15-19-01_job-1c325595-1ca8-441f-8e94-43b2937c71d2', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 500, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 1000, 'save_total_limit': 2, 'save_on_each_node': False, 'no_cuda': False, 'seed': 42, 'bf16': False, 'fp16': True, 
'fp16_opt_level': 'O1', 'half_precision_backend': 'amp', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': 'None', 'local_rank': -1, 'xpu_backend': 'None', 'tpu_num_cores': 'None', 'tpu_metrics_debug': False, 'debug': '[]', 'dataloader_drop_last': False, 'eval_steps': 400, 'dataloader_num_workers': 0, 'past_index': -1, 'run_name': './', 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': 'None', 'load_best_model_at_end': False, 'metric_for_best_model': 'None', 'greater_is_better': 'None', 'ignore_data_skip': False, 'sharded_ddp': '[]', 'deepspeed': 'None', 'label_smoothing_factor': 0.0, 'optim': 'adamw_hf', 'adafactor': False, 'group_by_length': True, 'length_column_name': 'input_length', 'report_to': "['wandb']", 'ddp_find_unused_parameters': 'None', 'ddp_bucket_cap_mb': 'None', 'dataloader_pin_memory': True, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': True, 'resume_from_checkpoint': 'None', 'hub_model_id': 'None', 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'gradient_checkpointing': True, 'fp16_backend': 'auto', 'push_to_hub_model_id': 'None', 'push_to_hub_organization': 'None', 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', '_n_gpu': 1, 'mp_parameters': '', 'train_batch_size': 32, 'eval_batch_size': 8}
 2022-02-04 15:21:20,519 INFO    MainThread:582896 [wandb_watch.py:watch():43] Watching
+2022-02-04 16:59:04,749 INFO    MainThread:582896 [wandb_run.py:_atexit_cleanup():1780] got exitcode: 255
+2022-02-04 16:59:04,751 INFO    MainThread:582896 [wandb_run.py:_restore():1752] restore

wandb/run-20220204_152118-2dc06ifr/run-2dc06ifr.wandb CHANGED Viewed

Binary files a/wandb/run-20220204_152118-2dc06ifr/run-2dc06ifr.wandb and b/wandb/run-20220204_152118-2dc06ifr/run-2dc06ifr.wandb differ

wandb/run-20220204_170031-gzsqxey3/files/conda-environment.yaml ADDED Viewed

File without changes

wandb/run-20220204_170031-gzsqxey3/files/config.yaml ADDED Viewed

The diff for this file is too large to render. See raw diff

wandb/run-20220204_170031-gzsqxey3/files/output.log ADDED Viewed

	@@ -0,0 +1,533 @@

+ 11%|███████                                                         | 499/4560 [23:43<3:19:11,  2.94s/it]
+ 11%|███████                                                         | 500/4560 [23:47<3:44:34,  3.32s/it]The following columns in the evaluation set  don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.
+***** Running Evaluation *****
+  Num examples = 1681
+  Batch size = 8
+Configuration saved in ./checkpoint-500/config.json
+{'eval_loss': 3.128021001815796, 'eval_wer': 1.0, 'eval_runtime': 61.7966, 'eval_samples_per_second': 27.202, 'eval_steps_per_second': 3.414, 'epoch': 8.77}
+Model weights saved in ./checkpoint-500/pytorch_model.bin
+Configuration saved in ./checkpoint-500/preprocessor_config.json

wandb/run-20220204_170031-gzsqxey3/files/requirements.txt ADDED Viewed

	@@ -0,0 +1,171 @@

+-atasets==1.17.1.dev0
+-ransformers==4.16.0.dev0
+aiohttp==3.8.1
+aiosignal==1.2.0
+analytics-python==1.4.0
+appdirs==1.4.4
+argon2-cffi==20.1.0
+async-generator==1.10
+async-timeout==4.0.2
+attrs==21.1.0
+audioread==2.1.9
+backcall==0.2.0
+backoff==1.10.0
+bcrypt==3.2.0
+beautifulsoup4==4.9.3
+bleach==3.3.0
+brotlipy==0.7.0
+certifi==2020.12.5
+cffi==1.14.3
+chardet==3.0.4
+charset-normalizer==2.0.10
+click==8.0.3
+conda-build==3.21.4
+conda-package-handling==1.7.2
+conda==4.9.2
+configparser==5.2.0
+cryptography==3.2.1
+cycler==0.11.0
+datasets==1.18.3
+decorator==4.4.2
+defusedxml==0.7.1
+dill==0.3.4
+dnspython==2.1.0
+docker-pycreds==0.4.0
+entrypoints==0.3
+ffmpy==0.3.0
+filelock==3.0.12
+flask-cachebuster==1.0.0
+flask-cors==3.0.10
+flask-login==0.5.0
+flask==2.0.2
+fonttools==4.28.5
+frozenlist==1.3.0
+fsspec==2022.1.0
+gitdb==4.0.9
+gitpython==3.1.26
+glob2==0.7
+gradio==2.7.0
+huggingface-hub==0.4.0
+hypothesis==6.36.1
+idna==2.10
+ipykernel==5.5.4
+ipython-genutils==0.2.0
+ipython==7.21.0
+ipywidgets==7.6.3
+itsdangerous==2.0.1
+jedi==0.17.0
+jinja2==3.0.3
+jiwer==2.3.0
+joblib==1.1.0
+json5==0.9.5
+jsonschema==3.2.0
+jupyter-client==6.1.12
+jupyter-core==4.7.1
+jupyterlab-pygments==0.1.2
+jupyterlab-server==1.2.0
+jupyterlab-widgets==1.0.0
+jupyterlab==2.2.9
+kenlm==0.0.0
+kiwisolver==1.3.2
+libarchive-c==2.9
+librosa==0.8.1
+llvmlite==0.38.0
+markdown2==2.4.2
+markupsafe==2.0.1
+matplotlib==3.5.1
+mistune==0.8.4
+mkl-fft==1.3.0
+mkl-random==1.1.1
+mkl-service==2.3.0
+monotonic==1.6
+multidict==5.2.0
+multiprocess==0.70.12.2
+nano==0.10.0
+nbclient==0.5.3
+nbconvert==6.0.7
+nbformat==5.1.3
+nest-asyncio==1.5.1
+notebook==6.3.0
+numba==0.55.0
+numpy==1.19.2
+olefile==0.46
+packaging==20.9
+pandas==1.3.5
+pandocfilters==1.4.3
+paramiko==2.9.2
+parso==0.8.1
+pathtools==0.1.2
+pexpect==4.8.0
+pickleshare==0.7.5
+pillow==8.1.2
+pip==21.3.1
+pkginfo==1.7.0
+pooch==1.5.2
+prometheus-client==0.10.1
+promise==2.3
+prompt-toolkit==3.0.8
+protobuf==3.19.3
+psutil==5.8.0
+ptyprocess==0.7.0
+pyarrow==6.0.1
+pycosat==0.6.3
+pycparser==2.20
+pycryptodome==3.12.0
+pyctcdecode==0.3.0
+pydub==0.25.1
+pygments==2.8.0
+pygtrie==2.4.2
+pynacl==1.5.0
+pyopenssl==19.1.0
+pyparsing==2.4.7
+pyrsistent==0.17.3
+pysocks==1.7.1
+python-dateutil==2.8.1
+python-etcd==0.4.5
+python-levenshtein==0.12.2
+pytz==2021.1
+pyyaml==5.4.1
+pyzmq==22.0.3
+regex==2022.1.18
+requests==2.24.0
+resampy==0.2.2
+ruamel-yaml==0.15.87
+sacremoses==0.0.47
+scikit-learn==1.0.2
+scipy==1.7.3
+send2trash==1.5.0
+sentry-sdk==1.5.4
+setuptools==50.3.1.post20201107
+shortuuid==1.0.8
+six==1.15.0
+smmap==5.0.0
+sortedcontainers==2.4.0
+soundfile==0.10.3.post1
+soupsieve==2.2
+subprocess32==3.5.4
+termcolor==1.1.0
+terminado==0.9.4
+testpath==0.4.4
+threadpoolctl==3.0.0
+tokenizers==0.11.4
+torch==1.10.1
+torchaudio==0.10.1
+torchelastic==0.2.2
+torchtext==0.9.1
+torchvision==0.9.1
+tornado==6.1
+tqdm==4.62.3
+traitlets==5.0.5
+transformers==4.17.0.dev0
+typing-extensions==3.7.4.3
+urllib3==1.25.11
+wandb==0.12.9
+wcwidth==0.2.5
+webencodings==0.5.1
+werkzeug==2.0.2
+wheel==0.35.1
+widgetsnbextension==3.5.1
+xxhash==2.0.2
+yarl==1.7.2
+yaspin==2.1.0

wandb/run-20220204_170031-gzsqxey3/files/wandb-metadata.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+    "os": "Linux-5.11.0-37-generic-x86_64-with-glibc2.10",
+    "python": "3.8.8",
+    "heartbeatAt": "2022-02-04T17:00:32.947275",
+    "startedAt": "2022-02-04T17:00:31.683578",
+    "docker": null,
+    "gpu": "Tesla V100S-PCIE-32GB",
+    "gpu_count": 1,
+    "cpu_count": 60,
+    "cuda": null,
+    "args": [
+        "--dataset_name=mozilla-foundation/common_voice_8_0",
+        "--model_name_or_path=facebook/wav2vec2-xls-r-300m",
+        "--dataset_config_name=el",
+        "--output_dir=./",
+        "--overwrite_output_dir",
+        "--num_train_epochs=80",
+        "--per_device_train_batch_size=32",
+        "--gradient_accumulation_steps=2",
+        "--learning_rate=5e-5",
+        "--warmup_steps=400",
+        "--lr_scheduler_type=linear",
+        "--feat_proj_dropout=0.1",
+        "--attention_dropout=0.1",
+        "--max_duration_in_seconds=15",
+        "--mask_time_prob=0.4",
+        "--mask_feature_prob=0.1",
+        "--evaluation_strategy=steps",
+        "--text_column_name=sentence",
+        "--length_column_name=input_length",
+        "--save_steps=500",
+        "--eval_steps=500",
+        "--layerdrop=0.0",
+        "--save_total_limit=2",
+        "--freeze_feature_encoder",
+        "--gradient_checkpointing",
+        "--fp16",
+        "--push_to_hub",
+        "--group_by_length",
+        "--do_train",
+        "--do_eval"
+    ],
+    "state": "running",
+    "program": "run_speech_recognition_ctc.py",
+    "codePath": "run_speech_recognition_ctc.py",
+    "git": {
+        "remote": "https://huggingface.co/ayameRushia/wav2vec2-large-xls-r-300m-el",
+        "commit": "dc39b02954010cda629c3aadbcb5e0ab724f8d16"
+    },
+    "email": "magunghambali@gmail.com",
+    "root": "/workspace/wav2vec2-large-xls-r-300m-el",
+    "host": "job-1c325595-1ca8-441f-8e94-43b2937c71d2",
+    "username": "ovh",
+    "executable": "/opt/conda/bin/python"
+}

wandb/run-20220204_170031-gzsqxey3/files/wandb-summary.json ADDED Viewed

The diff for this file is too large to render. See raw diff

wandb/run-20220204_170031-gzsqxey3/logs/debug-internal.log ADDED Viewed

The diff for this file is too large to render. See raw diff

wandb/run-20220204_170031-gzsqxey3/logs/debug.log ADDED Viewed

	@@ -0,0 +1,26 @@

+2022-02-04 17:00:31,686 INFO    MainThread:622234 [wandb_setup.py:_flush():71] Unhandled environment var: WANDB_RUN
+2022-02-04 17:00:31,686 INFO    MainThread:622234 [wandb_setup.py:_flush():71] setting env: {'project': 'wav2vec2-mn-1', 'run_name': 'run dataset 1.18.3'}
+2022-02-04 17:00:31,687 INFO    MainThread:622234 [wandb_setup.py:_flush():71] setting login settings: {}
+2022-02-04 17:00:31,687 INFO    MainThread:622234 [wandb_init.py:_log_setup():371] Logging user logs to /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_170031-gzsqxey3/logs/debug.log
+2022-02-04 17:00:31,687 INFO    MainThread:622234 [wandb_init.py:_log_setup():372] Logging internal logs to /workspace/wav2vec2-large-xls-r-300m-el/wandb/run-20220204_170031-gzsqxey3/logs/debug-internal.log
+2022-02-04 17:00:31,687 INFO    MainThread:622234 [wandb_init.py:init():404] calling init triggers
+2022-02-04 17:00:31,687 INFO    MainThread:622234 [wandb_init.py:init():409] wandb.init called with sweep_config: {}
+config: {}
+2022-02-04 17:00:31,687 INFO    MainThread:622234 [wandb_init.py:init():460] starting backend
+2022-02-04 17:00:31,687 INFO    MainThread:622234 [backend.py:_multiprocessing_setup():99] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
+2022-02-04 17:00:31,762 INFO    MainThread:622234 [backend.py:ensure_launched():216] starting backend process...
+2022-02-04 17:00:31,853 INFO    MainThread:622234 [backend.py:ensure_launched():221] started backend process with pid: 622748
+2022-02-04 17:00:31,856 INFO    MainThread:622234 [wandb_init.py:init():469] backend started and connected
+2022-02-04 17:00:31,866 INFO    MainThread:622234 [wandb_init.py:init():533] updated telemetry
+2022-02-04 17:00:32,016 INFO    MainThread:622234 [wandb_init.py:init():563] communicating current version
+2022-02-04 17:00:32,744 INFO    MainThread:622234 [wandb_init.py:init():568] got version response upgrade_message: "wandb version 0.12.10 is available!  To upgrade, please run:\n $ pip install wandb --upgrade"
+2022-02-04 17:00:32,744 INFO    MainThread:622234 [wandb_init.py:init():578] communicating run to backend with 30 second timeout
+2022-02-04 17:00:32,936 INFO    MainThread:622234 [wandb_init.py:init():606] starting run threads in backend
+2022-02-04 17:00:33,569 INFO    MainThread:622234 [wandb_run.py:_console_start():1810] atexit reg
+2022-02-04 17:00:33,570 INFO    MainThread:622234 [wandb_run.py:_redirect():1684] redirect: SettingsConsole.REDIRECT
+2022-02-04 17:00:33,571 INFO    MainThread:622234 [wandb_run.py:_redirect():1689] Redirecting console.
+2022-02-04 17:00:33,575 INFO    MainThread:622234 [wandb_run.py:_redirect():1745] Redirects installed.
+2022-02-04 17:00:33,575 INFO    MainThread:622234 [wandb_init.py:init():633] run started, returning control to user process
+2022-02-04 17:00:33,579 INFO    MainThread:622234 [wandb_run.py:_config_callback():956] config_cb None None {'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': 'float32', 'use_bfloat16': False, 'pruned_heads': {}, 'tie_word_embeddings': True, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'chunk_size_feed_forward': 0, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'architectures': ['Wav2Vec2ForPreTraining'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': 1, 'pad_token_id': 48, 'eos_token_id': 2, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': None, 'problem_type': None, '_name_or_path': 'facebook/wav2vec2-xls-r-300m', 'transformers_version': '4.17.0.dev0', 'feat_extract_dropout': 0.0, 'model_type': 'wav2vec2', 'num_feat_extract_layers': 7, 'hidden_size': 1024, 'feat_extract_norm': 'layer', 'feat_extract_activation': 'gelu', 'conv_dim': [512, 512, 512, 512, 512, 512, 512], 'conv_stride': [5, 2, 2, 2, 2, 2, 2], 'conv_kernel': [10, 3, 3, 3, 3, 2, 2], 'conv_bias': True, 'num_conv_pos_embeddings': 128, 'num_conv_pos_embedding_groups': 16, 'num_hidden_layers': 24, 'intermediate_size': 4096, 'hidden_act': 'gelu', 'num_attention_heads': 16, 'hidden_dropout': 0.0, 'attention_dropout': 0.1, 'activation_dropout': 0.0, 
'feat_proj_dropout': 0.1, 'final_dropout': 0.0, 'layerdrop': 0.0, 'layer_norm_eps': 1e-05, 'initializer_range': 0.02, 'vocab_size': 51, 'do_stable_layer_norm': True, 'use_weighted_layer_sum': False, 'apply_spec_augment': True, 'mask_time_prob': 0.4, 'mask_time_length': 10, 'mask_time_min_masks': 2, 'mask_feature_prob': 0.1, 'mask_feature_length': 10, 'mask_feature_min_masks': 0, 'num_codevectors_per_group': 320, 'num_codevector_groups': 2, 'contrastive_logits_temperature': 0.1, 'feat_quantizer_dropout': 0.0, 'num_negatives': 100, 'codevector_dim': 768, 'proj_codevector_dim': 768, 'diversity_loss_weight': 0.1, 'ctc_loss_reduction': 'mean', 'ctc_zero_infinity': False, 'add_adapter': False, 'adapter_kernel_size': 3, 'adapter_stride': 2, 'num_adapter_layers': 3, 'output_hidden_size': 1024, 'classifier_proj_size': 256, 'tdnn_dim': [512, 512, 512, 512, 1500], 'tdnn_kernel': [5, 3, 3, 1, 1], 'tdnn_dilation': [1, 2, 3, 1, 1], 'xvector_output_dim': 512, 'output_dir': './', 'overwrite_output_dir': True, 'do_train': True, 'do_eval': True, 'do_predict': False, 'evaluation_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 32, 'per_device_eval_batch_size': 8, 'per_gpu_train_batch_size': 'None', 'per_gpu_eval_batch_size': 'None', 'gradient_accumulation_steps': 2, 'eval_accumulation_steps': 'None', 'learning_rate': 5e-05, 'weight_decay': 0.0, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 80.0, 'max_steps': -1, 'lr_scheduler_type': 'linear', 'warmup_ratio': 0.0, 'warmup_steps': 400, 'log_level': -1, 'log_level_replica': -1, 'log_on_each_node': True, 'logging_dir': './runs/Feb04_16-59-26_job-1c325595-1ca8-441f-8e94-43b2937c71d2', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 500, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 500, 'save_total_limit': 2, 'save_on_each_node': False, 'no_cuda': False, 'seed': 42, 'bf16': False, 'fp16': True, 
'fp16_opt_level': 'O1', 'half_precision_backend': 'amp', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': 'None', 'local_rank': -1, 'xpu_backend': 'None', 'tpu_num_cores': 'None', 'tpu_metrics_debug': False, 'debug': '[]', 'dataloader_drop_last': False, 'eval_steps': 500, 'dataloader_num_workers': 0, 'past_index': -1, 'run_name': './', 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': 'None', 'load_best_model_at_end': False, 'metric_for_best_model': 'None', 'greater_is_better': 'None', 'ignore_data_skip': False, 'sharded_ddp': '[]', 'deepspeed': 'None', 'label_smoothing_factor': 0.0, 'optim': 'adamw_hf', 'adafactor': False, 'group_by_length': True, 'length_column_name': 'input_length', 'report_to': "['wandb']", 'ddp_find_unused_parameters': 'None', 'ddp_bucket_cap_mb': 'None', 'dataloader_pin_memory': True, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': True, 'resume_from_checkpoint': 'None', 'hub_model_id': 'None', 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'gradient_checkpointing': True, 'fp16_backend': 'auto', 'push_to_hub_model_id': 'None', 'push_to_hub_organization': 'None', 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', '_n_gpu': 1, 'mp_parameters': '', 'train_batch_size': 32, 'eval_batch_size': 8}
+2022-02-04 17:00:33,583 INFO    MainThread:622234 [wandb_watch.py:watch():43] Watching

wandb/run-20220204_170031-gzsqxey3/run-gzsqxey3.wandb ADDED Viewed

Binary file (803 kB). View file