End of training

Browse files

Files changed (6) hide show

README.md +121 -0
config.json +118 -0
model.safetensors +3 -0
preprocessor_config.json +9 -0
runs/Nov27_09-31-34_7fadf3e13014/events.out.tfevents.1701077777.7fadf3e13014.1082.0 +3 -0
training_args.bin +3 -0

README.md ADDED Viewed

	@@ -0,0 +1,121 @@

+---
+license: apache-2.0
+base_model: facebook/wav2vec2-base
+tags:
+- generated_from_trainer
+metrics:
+- wer
+model-index:
+- name: wav2vec2-1
+  results: []
+---
+<!-- This model card has been generated automatically according to the information the Trainer had access to. You
+should probably proofread and complete it, then remove this comment. -->
+# wav2vec2-1
+This model is a fine-tuned version of [facebook/wav2vec2-base](https://huggingface.co/facebook/wav2vec2-base) on an unspecified dataset (the dataset name was not recorded by the Trainer).
+It achieves the following results on the evaluation set at the final checkpoint (epoch 30, step 30000):
+- Loss: 0.8870
+- Wer: 0.3805
+## Model description
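+A `Wav2Vec2ForCTC` model (12 transformer layers, hidden size 768, CTC vocabulary of 32 tokens) whose feature extractor is configured for a 16 kHz sampling rate. More information needed.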
+## Intended uses & limitations
+More information needed
+## Training and evaluation data
+More information needed
+## Training procedure
+### Training hyperparameters
+The following hyperparameters were used during training:
+- learning_rate: 0.0001
+- train_batch_size: 8
+- eval_batch_size: 8
+- seed: 42
+- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
+- lr_scheduler_type: linear
+- lr_scheduler_warmup_steps: 1000
+- num_epochs: 30
+- mixed_precision_training: Native AMP
+### Training results
+| Training Loss | Epoch | Step  | Validation Loss | Wer    |
+|:-------------:|:-----:|:-----:|:---------------:|:------:|
+| 4.6457        | 0.5   | 500   | 2.8866          | 0.9999 |
+| 2.863         | 1.0   | 1000  | 2.8676          | 1.0    |
+| 1.8085        | 1.5   | 1500  | 0.9396          | 0.6602 |
+| 0.8828        | 2.0   | 2000  | 0.7278          | 0.5699 |
+| 0.6659        | 2.5   | 2500  | 0.7000          | 0.5401 |
+| 0.6085        | 3.0   | 3000  | 0.7143          | 0.4939 |
+| 0.4878        | 3.5   | 3500  | 0.5845          | 0.4717 |
+| 0.4888        | 4.0   | 4000  | 0.6201          | 0.4677 |
+| 0.4022        | 4.5   | 4500  | 0.5984          | 0.4532 |
+| 0.3947        | 5.0   | 5000  | 0.5874          | 0.4378 |
+| 0.3415        | 5.5   | 5500  | 0.6486          | 0.4405 |
+| 0.3413        | 6.0   | 6000  | 0.5988          | 0.4355 |
+| 0.2903        | 6.5   | 6500  | 0.6584          | 0.4304 |
+| 0.3046        | 7.0   | 7000  | 0.6602          | 0.4189 |
+| 0.2625        | 7.5   | 7500  | 0.5924          | 0.4235 |
+| 0.2625        | 8.0   | 8000  | 0.6541          | 0.4212 |
+| 0.2341        | 8.5   | 8500  | 0.6365          | 0.4171 |
+| 0.2384        | 9.0   | 9000  | 0.6095          | 0.4182 |
+| 0.2052        | 9.5   | 9500  | 0.6675          | 0.4091 |
+| 0.2124        | 10.0  | 10000 | 0.6524          | 0.4110 |
+| 0.1915        | 10.5  | 10500 | 0.6877          | 0.4122 |
+| 0.1922        | 11.0  | 11000 | 0.6857          | 0.4122 |
+| 0.1719        | 11.5  | 11500 | 0.6881          | 0.4056 |
+| 0.1811        | 12.0  | 12000 | 0.6832          | 0.4083 |
+| 0.1554        | 12.5  | 12500 | 0.7378          | 0.4103 |
+| 0.163         | 13.0  | 13000 | 0.6940          | 0.4019 |
+| 0.1452        | 13.5  | 13500 | 0.6811          | 0.3993 |
+| 0.1457        | 14.0  | 14000 | 0.7216          | 0.4007 |
+| 0.1319        | 14.5  | 14500 | 0.7243          | 0.3996 |
+| 0.1367        | 15.0  | 15000 | 0.7332          | 0.4006 |
+| 0.118         | 15.5  | 15500 | 0.7609          | 0.4050 |
+| 0.121         | 16.0  | 16000 | 0.7585          | 0.4021 |
+| 0.1096        | 16.5  | 16500 | 0.7583          | 0.4003 |
+| 0.112         | 17.0  | 17000 | 0.7928          | 0.4011 |
+| 0.1063        | 17.5  | 17500 | 0.7794          | 0.4038 |
+| 0.1009        | 18.0  | 18000 | 0.7474          | 0.3982 |
+| 0.0931        | 18.5  | 18500 | 0.8143          | 0.3980 |
+| 0.0943        | 19.0  | 19000 | 0.7873          | 0.4000 |
+| 0.0847        | 19.5  | 19500 | 0.8064          | 0.3991 |
+| 0.0831        | 20.0  | 20000 | 0.8564          | 0.3967 |
+| 0.0821        | 20.5  | 20500 | 0.8632          | 0.3956 |
+| 0.0807        | 21.0  | 21000 | 0.8250          | 0.3928 |
+| 0.0748        | 21.5  | 21500 | 0.8389          | 0.3949 |
+| 0.0751        | 22.0  | 22000 | 0.8355          | 0.3943 |
+| 0.072         | 22.5  | 22500 | 0.8568          | 0.3930 |
+| 0.0696        | 23.0  | 23000 | 0.8396          | 0.3912 |
+| 0.0678        | 23.5  | 23500 | 0.8634          | 0.3901 |
+| 0.0671        | 24.0  | 24000 | 0.8576          | 0.3880 |
+| 0.063         | 24.5  | 24500 | 0.8303          | 0.3876 |
+| 0.0575        | 25.0  | 25000 | 0.9125          | 0.3847 |
+| 0.0572        | 25.5  | 25500 | 0.8745          | 0.3839 |
+| 0.0572        | 26.0  | 26000 | 0.8714          | 0.3844 |
+| 0.0533        | 26.5  | 26500 | 0.8824          | 0.3840 |
+| 0.0496        | 27.0  | 27000 | 0.8993          | 0.3830 |
+| 0.0525        | 27.5  | 27500 | 0.8818          | 0.3830 |
+| 0.0514        | 28.0  | 28000 | 0.8874          | 0.3819 |
+| 0.0464        | 28.5  | 28500 | 0.8947          | 0.3802 |
+| 0.0473        | 29.0  | 29000 | 0.9028          | 0.3805 |
+| 0.048         | 29.5  | 29500 | 0.8899          | 0.3801 |
+| 0.0458        | 30.0  | 30000 | 0.8870          | 0.3805 |
+### Framework versions
+- Transformers 4.35.2
+- Pytorch 2.1.0+cu118
+- Datasets 2.15.0
+- Tokenizers 0.15.0

config.json ADDED Viewed

	@@ -0,0 +1,118 @@

+{
+  "_name_or_path": "facebook/wav2vec2-base",
+  "activation_dropout": 0.0,
+  "adapter_attn_dim": null,
+  "adapter_kernel_size": 3,
+  "adapter_stride": 2,
+  "add_adapter": false,
+  "apply_spec_augment": true,
+  "architectures": [
+    "Wav2Vec2ForCTC"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "codevector_dim": 256,
+  "contrastive_logits_temperature": 0.1,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "mean",
+  "ctc_zero_infinity": false,
+  "diversity_loss_weight": 0.1,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.1,
+  "feat_quantizer_dropout": 0.0,
+  "final_dropout": 0.0,
+  "freeze_feat_extract_train": true,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_channel_length": 10,
+  "mask_channel_min_space": 1,
+  "mask_channel_other": 0.0,
+  "mask_channel_prob": 0.0,
+  "mask_channel_selection": "static",
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_min_space": 1,
+  "mask_time_other": 0.0,
+  "mask_time_prob": 0.05,
+  "mask_time_selection": "static",
+  "model_type": "wav2vec2",
+  "no_mask_channel_overlap": false,
+  "no_mask_time_overlap": false,
+  "num_adapter_layers": 3,
+  "num_attention_heads": 12,
+  "num_codevector_groups": 2,
+  "num_codevectors_per_group": 320,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 12,
+  "num_negatives": 100,
+  "output_hidden_size": 768,
+  "pad_token_id": 29,
+  "proj_codevector_dim": 256,
+  "tdnn_dilation": [
+    1,
+    2,
+    3,
+    1,
+    1
+  ],
+  "tdnn_dim": [
+    512,
+    512,
+    512,
+    512,
+    1500
+  ],
+  "tdnn_kernel": [
+    5,
+    3,
+    3,
+    1,
+    1
+  ],
+  "torch_dtype": "float32",
+  "transformers_version": "4.35.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32,
+  "xvector_output_dim": 512
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:24ea676405fbab0744e6781a2dc920360b45152d8b72e34a2ca98f289fdf72a9
+size 377611120

preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+  "do_normalize": true,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0.0,
+  "return_attention_mask": false,
+  "sampling_rate": 16000
+}

runs/Nov27_09-31-34_7fadf3e13014/events.out.tfevents.1701077777.7fadf3e13014.1082.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:82e7b93ba16dee0c02809bbe41d3c22d64323ed5c7ee910bd0e3ce251b25aa4b
+size 35007

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c64a5c46c2063c6551945a069e05211bd2e8c26f274dbb6dbe94fd26051650a2
+size 4536