gopikachu
/

whisper-small-hi

@@ -2,7 +2,7 @@
 language:
 - hi
 license: apache-2.0
-base_model: openai/whisper-large
 tags:
 - generated_from_trainer
 datasets:
@@ -10,7 +10,7 @@ datasets:
 metrics:
 - wer
 model-index:
-- name: Whisper Large Hi - Gopika
   results:
   - task:
       name: Automatic Speech Recognition
@@ -22,18 +22,18 @@ model-index:
     metrics:
     - name: Wer
       type: wer
-      value: 96.73659673659674
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 should probably proofread and complete it, then remove this comment. -->
-# Whisper Large Hi - Gopika
-This model is a fine-tuned version of [openai/whisper-large](https://huggingface.co/openai/whisper-large) on the Konnakol dataset.
 It achieves the following results on the evaluation set:
-- Loss: 2.2174
-- Wer: 96.7366
 ## Model description
@@ -52,30 +52,30 @@ More information needed
 ### Training hyperparameters
 The following hyperparameters were used during training:
-- learning_rate: 1e-05
-- train_batch_size: 16
-- eval_batch_size: 8
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
 - lr_scheduler_warmup_steps: 500
-- training_steps: 10000
 - mixed_precision_training: Native AMP
 ### Training results
-| Training Loss | Epoch    | Step  | Validation Loss | Wer     |
-|:-------------:|:--------:|:-----:|:---------------:|:-------:|
-| 0.0735        | 21.7391  | 1000  | 1.3101          | 93.7063 |
-| 0.0146        | 43.4783  | 2000  | 1.7063          | 87.5291 |
-| 0.0059        | 65.2174  | 3000  | 1.9682          | 94.1725 |
-| 0.0072        | 86.9565  | 4000  | 1.9777          | 93.0070 |
-| 0.0036        | 108.6957 | 5000  | 2.0244          | 96.9697 |
-| 0.0021        | 130.4348 | 6000  | 2.0688          | 96.9697 |
-| 0.0025        | 152.1739 | 7000  | 2.1008          | 96.3869 |
-| 0.0028        | 173.9130 | 8000  | 2.1506          | 97.0862 |
-| 0.0034        | 195.6522 | 9000  | 2.1841          | 97.9021 |
-| 0.0026        | 217.3913 | 10000 | 2.2174          | 96.7366 |
 ### Framework versions

 language:
 - hi
 license: apache-2.0
+base_model: openai/whisper-small
 tags:
 - generated_from_trainer
 datasets:
 metrics:
 - wer
 model-index:
+- name: Whisper Small Hi - Gopika Krishnan
   results:
   - task:
       name: Automatic Speech Recognition
     metrics:
     - name: Wer
       type: wer
+      value: 87.64568764568764
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 should probably proofread and complete it, then remove this comment. -->
+# Whisper Small Hi - Gopika Krishnan
+This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the Konnakol dataset.
 It achieves the following results on the evaluation set:
+- Loss: 2.2352
+- Wer: 87.6457
 ## Model description
 ### Training hyperparameters
 The following hyperparameters were used during training:
+- learning_rate: 0.0001
+- train_batch_size: 32
+- eval_batch_size: 16
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
 - lr_scheduler_warmup_steps: 500
+- training_steps: 5000
 - mixed_precision_training: Native AMP
 ### Training results
+| Training Loss | Epoch    | Step | Validation Loss | Wer     |
+|:-------------:|:--------:|:----:|:---------------:|:-------:|
+| 0.1507        | 21.7391  | 500  | 1.2891          | 87.7622 |
+| 0.0428        | 43.4783  | 1000 | 1.4133          | 93.7063 |
+| 0.0111        | 65.2174  | 1500 | 1.7252          | 89.3939 |
+| 0.0063        | 86.9565  | 2000 | 1.8134          | 85.8974 |
+| 0.0035        | 108.6957 | 2500 | 2.0195          | 85.7809 |
+| 0.003         | 130.4348 | 3000 | 2.0771          | 87.8788 |
+| 0.0027        | 152.1739 | 3500 | 2.1378          | 87.5291 |
+| 0.0025        | 173.9130 | 4000 | 2.1730          | 86.4802 |
+| 0.0025        | 195.6522 | 4500 | 2.2126          | 87.8788 |
+| 0.0025        | 217.3913 | 5000 | 2.2352          | 87.6457 |
 ### Framework versions

generation_config.json CHANGED Viewed

@@ -1,40 +1,44 @@
 {
   "alignment_heads": [
     [
-      9,
-      19
     ],
     [
-      11,
-      2
     ],
     [
-      11,
-      4
     ],
     [
-      11,
-      17
     ],
     [
-      22,
       7
     ],
     [
-      22,
-      11
     ],
     [
-      22,
-      17
     ],
     [
-      23,
-      2
     ],
     [
-      23,
-      15
     ]
   ],
   "begin_suppress_tokens": [
@@ -146,6 +150,7 @@
     "<|yo|>": 50325,
     "<|zh|>": 50260
   },
   "max_initial_timestamp_index": 50,
   "max_length": 448,
   "no_timestamps_token_id": 50363,

 {
   "alignment_heads": [
     [
+      5,
+      3
     ],
     [
+      5,
+      9
     ],
     [
+      8,
+      0
     ],
     [
+      8,
+      4
     ],
     [
+      8,
       7
     ],
     [
+      8,
+      8
     ],
     [
+      9,
+      0
     ],
     [
+      9,
+      7
+    ],
+    [
+      9,
+      9
     ],
     [
+      10,
+      5
     ]
   ],
   "begin_suppress_tokens": [
     "<|yo|>": 50325,
     "<|zh|>": 50260
   },
+  "language": "hindi",
   "max_initial_timestamp_index": 50,
   "max_length": 448,
   "no_timestamps_token_id": 50363,

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4e602d4f178354e6d3a11f49aff77724faa4466f5751f2a221487d031e13c3f7
 size 966995080

 version https://git-lfs.github.com/spec/v1
+oid sha256:072032d04333e568c87a151ce6cab4f820531b1218076deecdc8775e0250163e
 size 966995080