sanchit-gandhi's picture
Saving weights and logs of epoch 0
4f730f1
03/23/2022 18:02:15 - WARNING - datasets.builder - Reusing dataset librispeech_asr (/home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25)
03/23/2022 18:02:15 - WARNING - datasets.builder - Reusing dataset librispeech_asr (/home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25)
loading configuration file ./config.json
Model config SpeechEncoderDecoderConfig {
"_name_or_path": "./",
"architectures": [
"SpeechEncoderDecoderModel"
],
"cache_dir": "/home/sanchit_huggingface_co/cache/huggingface/transformers",
"decoder": {
"_name_or_path": "facebook/bart-large-cnn",
"_num_labels": 3,
"activation_dropout": 0.0,
"activation_function": "gelu",
"add_cross_attention": true,
"add_final_layer_norm": false,
"architectures": [
"BartForConditionalGeneration"
],
"attention_dropout": 0.0,
"bad_words_ids": null,
"bos_token_id": 0,
"chunk_size_feed_forward": 0,
"classif_dropout": 0.0,
"classifier_dropout": 0.0,
"cross_attention_hidden_size": null,
"d_model": 1024,
"decoder_attention_heads": 16,
"decoder_ffn_dim": 4096,
"decoder_layerdrop": 0.0,
"decoder_layers": 12,
"decoder_start_token_id": 2,
"diversity_penalty": 0.0,
"do_sample": false,
"dropout": 0.1,
"early_stopping": true,
"encoder_attention_heads": 16,
"encoder_ffn_dim": 4096,
"encoder_layerdrop": 0.0,
"encoder_layers": 12,
"encoder_no_repeat_ngram_size": 0,
"eos_token_id": 2,
"exponential_decay_length_penalty": null,
"finetuning_task": null,
"force_bos_token_to_be_generated": true,
"forced_bos_token_id": 0,
"forced_eos_token_id": 2,
"gradient_checkpointing": false,
"id2label": {
"0": "LABEL_0",
"1": "LABEL_1",
"2": "LABEL_2"
},
"init_std": 0.02,
"is_decoder": true,
"is_encoder_decoder": false,
"label2id": {
"LABEL_0": 0,
"LABEL_1": 1,
"LABEL_2": 2
},
"length_penalty": 2.0,
"max_length": 142,
"max_position_embeddings": 1024,
"min_length": 56,
"model_type": "bart",
"no_repeat_ngram_size": 3,
"normalize_before": false,
"num_beam_groups": 1,
"num_beams": 4,
"num_hidden_layers": 12,
"num_return_sequences": 1,
"output_attentions": false,
"output_hidden_states": false,
"output_past": true,
"output_scores": false,
"pad_token_id": 1,
"prefix": " ",
"problem_type": null,
"pruned_heads": {},
"remove_invalid_values": false,
"repetition_penalty": 1.0,
"return_dict": true,
"return_dict_in_generate": false,
"scale_embedding": false,
"sep_token_id": null,
"task_specific_params": {
"summarization": {
"early_stopping": true,
"length_penalty": 2.0,
"max_length": 142,
"min_length": 56,
"no_repeat_ngram_size": 3,
"num_beams": 4
}
},
"temperature": 1.0,
"tie_encoder_decoder": false,
"tie_word_embeddings": true,
"tokenizer_class": null,
"top_k": 50,
"top_p": 1.0,
"torch_dtype": null,
"torchscript": false,
"transformers_version": "4.18.0.dev0",
"typical_p": 1.0,
"use_bfloat16": false,
"use_cache": true,
"vocab_size": 50264
},
"decoder_start_token_id": 0,
"encoder": {
"_name_or_path": "facebook/wav2vec2-large-lv60",
"activation_dropout": 0.1,
"adapter_kernel_size": 3,
"adapter_stride": 2,
"add_adapter": true,
"add_cross_attention": false,
"apply_spec_augment": true,
"architectures": [
"Wav2Vec2ForPreTraining"
],
"attention_dropout": 0.1,
"bad_words_ids": null,
"bos_token_id": 1,
"chunk_size_feed_forward": 0,
"classifier_proj_size": 256,
"codevector_dim": 768,
"contrastive_logits_temperature": 0.1,
"conv_bias": true,
"conv_dim": [
512,
512,
512,
512,
512,
512,
512
],
"conv_kernel": [
10,
3,
3,
3,
3,
2,
2
],
"conv_stride": [
5,
2,
2,
2,
2,
2,
2
],
"cross_attention_hidden_size": null,
"ctc_loss_reduction": "sum",
"ctc_zero_infinity": false,
"decoder_start_token_id": null,
"diversity_loss_weight": 0.1,
"diversity_penalty": 0.0,
"do_sample": false,
"do_stable_layer_norm": true,
"early_stopping": false,
"encoder_no_repeat_ngram_size": 0,
"eos_token_id": 2,
"exponential_decay_length_penalty": null,
"feat_extract_activation": "gelu",
"feat_extract_dropout": 0.0,
"feat_extract_norm": "layer",
"feat_proj_dropout": 0.0,
"feat_quantizer_dropout": 0.0,
"final_dropout": 0.0,
"finetuning_task": null,
"forced_bos_token_id": null,
"forced_eos_token_id": null,
"gradient_checkpointing": false,
"hidden_act": "gelu",
"hidden_dropout": 0.1,
"hidden_dropout_prob": 0.1,
"hidden_size": 1024,
"id2label": {
"0": "LABEL_0",
"1": "LABEL_1"
},
"initializer_range": 0.02,
"intermediate_size": 4096,
"is_decoder": false,
"is_encoder_decoder": false,
"label2id": {
"LABEL_0": 0,
"LABEL_1": 1
},
"layer_norm_eps": 1e-05,
"layerdrop": 0.0,
"length_penalty": 1.0,
"mask_feature_length": 10,
"mask_feature_min_masks": 0,
"mask_feature_prob": 0.0,
"mask_time_length": 10,
"mask_time_min_masks": 2,
"mask_time_prob": 0.1,
"max_length": 20,
"min_length": 0,
"model_type": "wav2vec2",
"no_repeat_ngram_size": 0,
"num_adapter_layers": 3,
"num_attention_heads": 16,
"num_beam_groups": 1,
"num_beams": 1,
"num_codevector_groups": 2,
"num_codevectors_per_group": 320,
"num_conv_pos_embedding_groups": 16,
"num_conv_pos_embeddings": 128,
"num_feat_extract_layers": 7,
"num_hidden_layers": 24,
"num_negatives": 100,
"num_return_sequences": 1,
"output_attentions": false,
"output_hidden_size": 1024,
"output_hidden_states": false,
"output_scores": false,
"pad_token_id": 0,
"prefix": null,
"problem_type": null,
"proj_codevector_dim": 768,
"pruned_heads": {},
"remove_invalid_values": false,
"repetition_penalty": 1.0,
"return_dict": true,
"return_dict_in_generate": false,
"sep_token_id": null,
"task_specific_params": null,
"tdnn_dilation": [
1,
2,
3,
1,
1
],
"tdnn_dim": [
512,
512,
512,
512,
1500
],
"tdnn_kernel": [
5,
3,
3,
1,
1
],
"temperature": 1.0,
"tie_encoder_decoder": false,
"tie_word_embeddings": true,
"tokenizer_class": null,
"top_k": 50,
"top_p": 1.0,
"torch_dtype": null,
"torchscript": false,
"transformers_version": "4.18.0.dev0",
"typical_p": 1.0,
"use_bfloat16": false,
"use_weighted_layer_sum": false,
"vocab_size": 32,
"xvector_output_dim": 512
},
"eos_token_id": 2,
"is_encoder_decoder": true,
"max_length": 40,
"model_type": "speech-encoder-decoder",
"pad_token_id": 1,
"processor_class": "Wav2Vec2Processor",
"transformers_version": null,
"use_cache": false
}
loading feature extractor configuration file ./preprocessor_config.json
Feature extractor Wav2Vec2FeatureExtractor {
"do_normalize": true,
"feature_extractor_type": "Wav2Vec2FeatureExtractor",
"feature_size": 1,
"padding_side": "right",
"padding_value": 0.0,
"return_attention_mask": true,
"sampling_rate": 16000
}
Didn't find file ./added_tokens.json. We won't load it.
loading file ./vocab.json
loading file ./merges.txt
loading file ./tokenizer.json
loading file None
loading file ./special_tokens_map.json
loading file ./tokenizer_config.json
loading weights file ./flax_model.msgpack
tcmalloc: large alloc 2353643520 bytes == 0x96e34000 @ 0x7f92b0d7d680 0x7f92b0d9e824 0x5f9ec1 0x649811 0x5c4706 0x4f2c4e 0x6501b8 0x504be3 0x56b5e0 0x5696da 0x5f6403 0x50b271 0x5f55f2 0x56cbfb 0x5696da 0x50add0 0x56c5d1 0x5696da 0x5f6403 0x56b3fe 0x5696da 0x68db17 0x67eeb1 0x67ef2f 0x67efd1 0x67f377 0x6b7902 0x6b7c8d 0x7f92b0b910b3 0x5fb12e
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-ea15d97b9566d103.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-d7fc571278966c76.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-4965e6e979b2b60b.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-8a47bb6f96f32026.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-cbbe1288df13cab7.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-b2269d84247a33b4.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-8bb3e3321558a7fe.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-7fca762335ab1cb3.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-05ecf5d454b27d4c.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-997bee0e4ee82287.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-38358ff6a9f589a1.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-c9efc32c2d772ecc.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-aac567c0d49b9306.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-b56ddb8551754afc.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-9fd80e6a76a5c81d.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-4b6374f1e99ab634.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-68ddf7581351ecc6.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-f2cf0710b724a5f2.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-44af87c7b0820e05.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-ba5d520ccccec157.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-19fa7abaf3b91fad.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-6bcf29dd446af266.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-1251ad556665a7a6.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-994a8fe7d263f650.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-75cd8234878cd5c4.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-a067d3c7a8914aa8.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-bf947cc62d7008e0.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-147583e7c14ed101.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-9ed1c08ef2966ee4.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-f74f5ab629122ac5.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-9beeeed44badf1ee.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-e998c5138e26cd17.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-a0e04d4db6254683_00000_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-a0e04d4db6254683_00001_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-a0e04d4db6254683_00002_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-a0e04d4db6254683_00003_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-a0e04d4db6254683_00004_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-a0e04d4db6254683_00005_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-a0e04d4db6254683_00006_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-a0e04d4db6254683_00007_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-a0e04d4db6254683_00008_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-a0e04d4db6254683_00009_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-a0e04d4db6254683_00010_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-a0e04d4db6254683_00011_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-a0e04d4db6254683_00012_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-a0e04d4db6254683_00013_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-a0e04d4db6254683_00014_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-a0e04d4db6254683_00015_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-9d1cc78efd8c6a64_00000_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-9d1cc78efd8c6a64_00001_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-9d1cc78efd8c6a64_00002_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-9d1cc78efd8c6a64_00003_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-9d1cc78efd8c6a64_00004_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-9d1cc78efd8c6a64_00005_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-9d1cc78efd8c6a64_00006_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-9d1cc78efd8c6a64_00007_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-9d1cc78efd8c6a64_00008_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-9d1cc78efd8c6a64_00009_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-9d1cc78efd8c6a64_00010_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-9d1cc78efd8c6a64_00011_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-9d1cc78efd8c6a64_00012_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-9d1cc78efd8c6a64_00013_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-9d1cc78efd8c6a64_00014_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-9d1cc78efd8c6a64_00015_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-6cda192980aa4e0d_00000_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-6cda192980aa4e0d_00001_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-6cda192980aa4e0d_00002_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-6cda192980aa4e0d_00003_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-6cda192980aa4e0d_00004_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-6cda192980aa4e0d_00005_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-6cda192980aa4e0d_00006_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-6cda192980aa4e0d_00007_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-6cda192980aa4e0d_00008_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-6cda192980aa4e0d_00009_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-6cda192980aa4e0d_00010_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-6cda192980aa4e0d_00011_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-6cda192980aa4e0d_00012_of_00016.arrow
All model checkpoint weights were used when initializing FlaxSpeechEncoderDecoderModel.
All the weights of FlaxSpeechEncoderDecoderModel were initialized from the model checkpoint at ./.
If your task is similar to the task the model of the checkpoint was trained on, you can already use FlaxSpeechEncoderDecoderModel for predictions without further training.
Feature extractor saved in ./preprocessor_config.json
tokenizer config file saved in ./tokenizer_config.json
Special tokens file saved in ./special_tokens_map.json
Configuration saved in ./config.json
loading feature extractor configuration file ./preprocessor_config.json
loading configuration file ./config.json
Model config SpeechEncoderDecoderConfig {
"_name_or_path": "./",
"architectures": [
"SpeechEncoderDecoderModel"
],
"cache_dir": "/home/sanchit_huggingface_co/cache/huggingface/transformers",
"decoder": {
"_name_or_path": "facebook/bart-large-cnn",
"_num_labels": 3,
"activation_dropout": 0.0,
"activation_function": "gelu",
"add_cross_attention": true,
"add_final_layer_norm": false,
"architectures": [
"BartForConditionalGeneration"
],
"attention_dropout": 0.0,
"bad_words_ids": null,
"bos_token_id": 0,
"chunk_size_feed_forward": 0,
"classif_dropout": 0.0,
"classifier_dropout": 0.0,
"cross_attention_hidden_size": null,
"d_model": 1024,
"decoder_attention_heads": 16,
"decoder_ffn_dim": 4096,
"decoder_layerdrop": 0.0,
"decoder_layers": 12,
"decoder_start_token_id": 2,
"diversity_penalty": 0.0,
"do_sample": false,
"dropout": 0.1,
"early_stopping": true,
"encoder_attention_heads": 16,
"encoder_ffn_dim": 4096,
"encoder_layerdrop": 0.0,
"encoder_layers": 12,
"encoder_no_repeat_ngram_size": 0,
"eos_token_id": 2,
"exponential_decay_length_penalty": null,
"finetuning_task": null,
"force_bos_token_to_be_generated": true,
"forced_bos_token_id": 0,
"forced_eos_token_id": 2,
"gradient_checkpointing": false,
"id2label": {
"0": "LABEL_0",
"1": "LABEL_1",
"2": "LABEL_2"
},
"init_std": 0.02,
"is_decoder": true,
"is_encoder_decoder": false,
"label2id": {
"LABEL_0": 0,
"LABEL_1": 1,
"LABEL_2": 2
},
"length_penalty": 2.0,
"max_length": 142,
"max_position_embeddings": 1024,
"min_length": 56,
"model_type": "bart",
"no_repeat_ngram_size": 3,
"normalize_before": false,
"num_beam_groups": 1,
"num_beams": 4,
"num_hidden_layers": 12,
"num_return_sequences": 1,
"output_attentions": false,
"output_hidden_states": false,
"output_past": true,
"output_scores": false,
"pad_token_id": 1,
"prefix": " ",
"problem_type": null,
"pruned_heads": {},
"remove_invalid_values": false,
"repetition_penalty": 1.0,
"return_dict": true,
"return_dict_in_generate": false,
"scale_embedding": false,
"sep_token_id": null,
"task_specific_params": {
"summarization": {
"early_stopping": true,
"length_penalty": 2.0,
"max_length": 142,
"min_length": 56,
"no_repeat_ngram_size": 3,
"num_beams": 4
}
},
"temperature": 1.0,
"tie_encoder_decoder": false,
"tie_word_embeddings": true,
"tokenizer_class": null,
"top_k": 50,
"top_p": 1.0,
"torch_dtype": null,
"torchscript": false,
"transformers_version": "4.18.0.dev0",
"typical_p": 1.0,
"use_bfloat16": false,
"use_cache": true,
"vocab_size": 50264
},
"decoder_start_token_id": 0,
"encoder": {
"_name_or_path": "facebook/wav2vec2-large-lv60",
"activation_dropout": 0.1,
"adapter_kernel_size": 3,
"adapter_stride": 2,
"add_adapter": true,
"add_cross_attention": false,
"apply_spec_augment": true,
"architectures": [
"Wav2Vec2ForPreTraining"
],
"attention_dropout": 0.1,
"bad_words_ids": null,
"bos_token_id": 1,
"chunk_size_feed_forward": 0,
"classifier_proj_size": 256,
"codevector_dim": 768,
"contrastive_logits_temperature": 0.1,
"conv_bias": true,
"conv_dim": [
512,
512,
512,
512,
512,
512,
512
],
"conv_kernel": [
10,
3,
3,
3,
3,
2,
2
],
"conv_stride": [
5,
2,
2,
2,
2,
2,
2
],
"cross_attention_hidden_size": null,
"ctc_loss_reduction": "sum",
"ctc_zero_infinity": false,
"decoder_start_token_id": null,
"diversity_loss_weight": 0.1,
"diversity_penalty": 0.0,
"do_sample": false,
"do_stable_layer_norm": true,
"early_stopping": false,
"encoder_no_repeat_ngram_size": 0,
"eos_token_id": 2,
"exponential_decay_length_penalty": null,
"feat_extract_activation": "gelu",
"feat_extract_dropout": 0.0,
"feat_extract_norm": "layer",
"feat_proj_dropout": 0.0,
"feat_quantizer_dropout": 0.0,
"final_dropout": 0.0,
"finetuning_task": null,
"forced_bos_token_id": null,
"forced_eos_token_id": null,
"gradient_checkpointing": false,
"hidden_act": "gelu",
"hidden_dropout": 0.1,
"hidden_dropout_prob": 0.1,
"hidden_size": 1024,
"id2label": {
"0": "LABEL_0",
"1": "LABEL_1"
},
"initializer_range": 0.02,
"intermediate_size": 4096,
"is_decoder": false,
"is_encoder_decoder": false,
"label2id": {
"LABEL_0": 0,
"LABEL_1": 1
},
"layer_norm_eps": 1e-05,
"layerdrop": 0.0,
"length_penalty": 1.0,
"mask_feature_length": 10,
"mask_feature_min_masks": 0,
"mask_feature_prob": 0.0,
"mask_time_length": 10,
"mask_time_min_masks": 2,
"mask_time_prob": 0.1,
"max_length": 20,
"min_length": 0,
"model_type": "wav2vec2",
"no_repeat_ngram_size": 0,
"num_adapter_layers": 3,
"num_attention_heads": 16,
"num_beam_groups": 1,
"num_beams": 1,
"num_codevector_groups": 2,
"num_codevectors_per_group": 320,
"num_conv_pos_embedding_groups": 16,
"num_conv_pos_embeddings": 128,
"num_feat_extract_layers": 7,
"num_hidden_layers": 24,
"num_negatives": 100,
"num_return_sequences": 1,
"output_attentions": false,
"output_hidden_size": 1024,
"output_hidden_states": false,
"output_scores": false,
"pad_token_id": 0,
"prefix": null,
"problem_type": null,
"proj_codevector_dim": 768,
"pruned_heads": {},
"remove_invalid_values": false,
"repetition_penalty": 1.0,
"return_dict": true,
"return_dict_in_generate": false,
"sep_token_id": null,
"task_specific_params": null,
"tdnn_dilation": [
1,
2,
3,
1,
1
],
"tdnn_dim": [
512,
512,
512,
512,
1500
],
"tdnn_kernel": [
5,
3,
3,
1,
1
],
"temperature": 1.0,
"tie_encoder_decoder": false,
"tie_word_embeddings": true,
"tokenizer_class": null,
"top_k": 50,
"top_p": 1.0,
"torch_dtype": null,
"torchscript": false,
"transformers_version": "4.18.0.dev0",
"typical_p": 1.0,
"use_bfloat16": false,
"use_weighted_layer_sum": false,
"vocab_size": 32,
"xvector_output_dim": 512
},
"eos_token_id": 2,
"is_encoder_decoder": true,
"max_length": 40,
"model_type": "speech-encoder-decoder",
"pad_token_id": 1,
"processor_class": "Wav2Vec2Processor",
"transformers_version": null,
"use_cache": false
}
loading feature extractor configuration file ./preprocessor_config.json
Feature extractor Wav2Vec2FeatureExtractor {
"do_normalize": true,
"feature_extractor_type": "Wav2Vec2FeatureExtractor",
"feature_size": 1,
"padding_side": "right",
"padding_value": 0.0,
"return_attention_mask": true,
"sampling_rate": 16000
}
Didn't find file ./added_tokens.json. We won't load it.
loading file ./vocab.json
loading file ./merges.txt
loading file ./tokenizer.json
loading file None
loading file ./special_tokens_map.json
loading file ./tokenizer_config.json
2022-03-23 18:02:36.574326: W tensorflow/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcuda.so.1'; dlerror: libcuda.so.1: cannot open shared object file: No such file or directory
2022-03-23 18:02:36.574364: W tensorflow/stream_executor/cuda/cuda_driver.cc:269] failed call to cuInit: UNKNOWN ERROR (303)
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-6cda192980aa4e0d_00013_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-6cda192980aa4e0d_00014_of_00016.arrow
03/23/2022 18:02:35 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-6cda192980aa4e0d_00015_of_00016.arrow
03/23/2022 18:02:36 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-ea385c5194cfd4e8_00000_of_00016.arrow
03/23/2022 18:02:36 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-ea385c5194cfd4e8_00001_of_00016.arrow
03/23/2022 18:02:36 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-ea385c5194cfd4e8_00002_of_00016.arrow
03/23/2022 18:02:36 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-ea385c5194cfd4e8_00003_of_00016.arrow
03/23/2022 18:02:36 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-ea385c5194cfd4e8_00004_of_00016.arrow
03/23/2022 18:02:36 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-ea385c5194cfd4e8_00005_of_00016.arrow
03/23/2022 18:02:36 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-ea385c5194cfd4e8_00006_of_00016.arrow
03/23/2022 18:02:36 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-ea385c5194cfd4e8_00007_of_00016.arrow
03/23/2022 18:02:36 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-ea385c5194cfd4e8_00008_of_00016.arrow
03/23/2022 18:02:36 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-ea385c5194cfd4e8_00009_of_00016.arrow
03/23/2022 18:02:36 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-ea385c5194cfd4e8_00010_of_00016.arrow
03/23/2022 18:02:36 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-ea385c5194cfd4e8_00011_of_00016.arrow
03/23/2022 18:02:36 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-ea385c5194cfd4e8_00012_of_00016.arrow
03/23/2022 18:02:36 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-ea385c5194cfd4e8_00013_of_00016.arrow
03/23/2022 18:02:36 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-ea385c5194cfd4e8_00014_of_00016.arrow
03/23/2022 18:02:36 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sanchit_huggingface_co/cache/huggingface/datasets/librispeech_asr/clean/2.1.0/8c6e15bda76db687d2a7c7198808151adecbb4d890ff463033a2e6f788c0ba25/cache-ea385c5194cfd4e8_00015_of_00016.arrow
03/23/2022 18:02:38 - WARNING - huggingface_hub.repository - /home/sanchit_huggingface_co/flax-wav2vec2-2-bart-large-cnn-gradient-accumulation/./ is already a clone of https://huggingface.co/sanchit-gandhi/flax-wav2vec2-2-bart-large-cnn-gradient-accumulation. Make sure you pull the latest changes with `repo.git_pull()`.
/home/sanchit_huggingface_co/flax-wav2vec2-2-bart-large-cnn-gradient-accumulation/./ is already a clone of https://huggingface.co/sanchit-gandhi/flax-wav2vec2-2-bart-large-cnn-gradient-accumulation. Make sure you pull the latest changes with `repo.git_pull()`.
Epoch ... (1/5): 0%| | 0/5 [00:00<?, ?it/s]
03/23/2022 18:02:41 - INFO - __main__ - ***** Running training *****
03/23/2022 18:02:41 - INFO - __main__ - Num examples = 20250
03/23/2022 18:02:41 - INFO - __main__ - Num Epochs = 5
03/23/2022 18:02:41 - INFO - __main__ - Instantaneous batch size per device = 2
03/23/2022 18:02:41 - INFO - __main__ - Total train batch size (w. parallel & distributed) = 16
03/23/2022 18:02:41 - INFO - __main__ - Total optimization steps = 6325
Training...: 0%| | 0/1265 [03:23<?, ?it/s]
Epoch ... (1/5): 0%| | 0/5 [03:28<?, ?it/s]
Traceback (most recent call last):
File "run_flax_speech_recognition_seq2seq.py", line 892, in <module>
main()
File "run_flax_speech_recognition_seq2seq.py", line 819, in main
state, train_metric = p_train_step(state, batch)
File "/home/sanchit_huggingface_co/venv/lib/python3.8/site-packages/jax/_src/traceback_util.py", line 162, in reraise_with_filtered_traceback
return fun(*args, **kwargs)
File "/home/sanchit_huggingface_co/venv/lib/python3.8/site-packages/jax/_src/api.py", line 1979, in cache_miss
out_tree, out_flat = f_pmapped_(*args, **kwargs)
File "/home/sanchit_huggingface_co/venv/lib/python3.8/site-packages/jax/_src/api.py", line 1855, in pmap_f
out = pxla.xla_pmap(
File "/home/sanchit_huggingface_co/venv/lib/python3.8/site-packages/jax/core.py", line 1797, in bind
return map_bind(self, fun, *args, **params)
File "/home/sanchit_huggingface_co/venv/lib/python3.8/site-packages/jax/core.py", line 1828, in map_bind
outs = primitive.process(top_trace, fun, tracers, params)
File "/home/sanchit_huggingface_co/venv/lib/python3.8/site-packages/jax/core.py", line 1800, in process
return trace.process_map(self, fun, tracers, params)
File "/home/sanchit_huggingface_co/venv/lib/python3.8/site-packages/jax/core.py", line 614, in process_call
return primitive.impl(f, *tracers, **params)
File "/home/sanchit_huggingface_co/venv/lib/python3.8/site-packages/jax/interpreters/pxla.py", line 804, in xla_pmap_impl
return compiled_fun(*args)
File "/home/sanchit_huggingface_co/venv/lib/python3.8/site-packages/jax/_src/profiler.py", line 206, in wrapper
return func(*args, **kwargs)
File "/home/sanchit_huggingface_co/venv/lib/python3.8/site-packages/jax/interpreters/pxla.py", line 1565, in __call__
out_bufs = self.xla_executable.execute_sharded_on_local_devices(input_bufs)
jax._src.traceback_util.UnfilteredStackTrace: RuntimeError: RESOURCE_EXHAUSTED: Attempting to reserve 4.49G at the bottom of memory. That was not possible. There are 6.67G free, 0B reserved, and 4.45G reservable.: while running replica 0 and partition 0 of a replicated computation (other replicas may have failed as well).
The stack trace below excludes JAX-internal frames.
The preceding is the original exception that occurred, unmodified.
--------------------
The above exception was the direct cause of the following exception:
Traceback (most recent call last):
File "run_flax_speech_recognition_seq2seq.py", line 892, in <module>
main()
File "run_flax_speech_recognition_seq2seq.py", line 819, in main
state, train_metric = p_train_step(state, batch)
RuntimeError: RESOURCE_EXHAUSTED: Attempting to reserve 4.49G at the bottom of memory. That was not possible. There are 6.67G free, 0B reserved, and 4.45G reservable.: while running replica 0 and partition 0 of a replicated computation (other replicas may have failed as well).