Ojro committed on
Commit
62a208b
1 Parent(s): 78f8ccb

End of training

Browse files
README.md CHANGED
@@ -2,22 +2,22 @@
2
  language:
3
  - mn
4
  license: apache-2.0
5
- base_model: openai/whisper-tiny
6
  tags:
7
  - generated_from_trainer
8
  datasets:
9
  - mozilla-foundation/common_voice_13_0
10
  model-index:
11
- - name: Whisper Tiny MN - Ochirsukh Batbold
12
  results: []
13
  ---
14
 
15
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
16
  should probably proofread and complete it, then remove this comment. -->
17
 
18
- # Whisper Tiny MN - Ochirsukh Batbold
19
 
20
- This model is a fine-tuned version of [openai/whisper-tiny](https://huggingface.co/openai/whisper-tiny) on the Common Voice 13 mn dataset.
21
 
22
  ## Model description
23
 
@@ -38,12 +38,12 @@ More information needed
38
  The following hyperparameters were used during training:
39
  - learning_rate: 1e-05
40
  - train_batch_size: 32
41
- - eval_batch_size: 16
42
  - seed: 42
43
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
44
- - lr_scheduler_type: linear
45
- - lr_scheduler_warmup_steps: 500
46
- - training_steps: 3
47
  - mixed_precision_training: Native AMP
48
 
49
  ### Training results
 
2
  language:
3
  - mn
4
  license: apache-2.0
5
+ base_model: openai/whisper-small
6
  tags:
7
  - generated_from_trainer
8
  datasets:
9
  - mozilla-foundation/common_voice_13_0
10
  model-index:
11
+ - name: Whisper Tiny Mn - Ochirsukh Batbold
12
  results: []
13
  ---
14
 
15
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
16
  should probably proofread and complete it, then remove this comment. -->
17
 
18
+ # Whisper Tiny Mn - Ochirsukh Batbold
19
 
20
+ This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the Common Voice 13 dataset.
21
 
22
  ## Model description
23
 
 
38
  The following hyperparameters were used during training:
39
  - learning_rate: 1e-05
40
  - train_batch_size: 32
41
+ - eval_batch_size: 32
42
  - seed: 42
43
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
44
+ - lr_scheduler_type: constant_with_warmup
45
+ - lr_scheduler_warmup_steps: 50
46
+ - training_steps: 5
47
  - mixed_precision_training: Native AMP
48
 
49
  ### Training results
config.json CHANGED
@@ -25,7 +25,20 @@
25
  "encoder_layerdrop": 0.0,
26
  "encoder_layers": 4,
27
  "eos_token_id": 50257,
28
- "forced_decoder_ids": null,
 
 
 
 
 
 
 
 
 
 
 
 
 
29
  "init_std": 0.02,
30
  "is_encoder_decoder": true,
31
  "mask_feature_length": 10,
@@ -43,10 +56,99 @@
43
  "num_mel_bins": 80,
44
  "pad_token_id": 50257,
45
  "scale_embedding": false,
46
- "suppress_tokens": [],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
47
  "torch_dtype": "float32",
48
  "transformers_version": "4.35.2",
49
- "use_cache": true,
50
  "use_weighted_layer_sum": false,
51
  "vocab_size": 51865
52
  }
 
25
  "encoder_layerdrop": 0.0,
26
  "encoder_layers": 4,
27
  "eos_token_id": 50257,
28
+ "forced_decoder_ids": [
29
+ [
30
+ 1,
31
+ 50259
32
+ ],
33
+ [
34
+ 2,
35
+ 50359
36
+ ],
37
+ [
38
+ 3,
39
+ 50363
40
+ ]
41
+ ],
42
  "init_std": 0.02,
43
  "is_encoder_decoder": true,
44
  "mask_feature_length": 10,
 
56
  "num_mel_bins": 80,
57
  "pad_token_id": 50257,
58
  "scale_embedding": false,
59
+ "suppress_tokens": [
60
+ 1,
61
+ 2,
62
+ 7,
63
+ 8,
64
+ 9,
65
+ 10,
66
+ 14,
67
+ 25,
68
+ 26,
69
+ 27,
70
+ 28,
71
+ 29,
72
+ 31,
73
+ 58,
74
+ 59,
75
+ 60,
76
+ 61,
77
+ 62,
78
+ 63,
79
+ 90,
80
+ 91,
81
+ 92,
82
+ 93,
83
+ 359,
84
+ 503,
85
+ 522,
86
+ 542,
87
+ 873,
88
+ 893,
89
+ 902,
90
+ 918,
91
+ 922,
92
+ 931,
93
+ 1350,
94
+ 1853,
95
+ 1982,
96
+ 2460,
97
+ 2627,
98
+ 3246,
99
+ 3253,
100
+ 3268,
101
+ 3536,
102
+ 3846,
103
+ 3961,
104
+ 4183,
105
+ 4667,
106
+ 6585,
107
+ 6647,
108
+ 7273,
109
+ 9061,
110
+ 9383,
111
+ 10428,
112
+ 10929,
113
+ 11938,
114
+ 12033,
115
+ 12331,
116
+ 12562,
117
+ 13793,
118
+ 14157,
119
+ 14635,
120
+ 15265,
121
+ 15618,
122
+ 16553,
123
+ 16604,
124
+ 18362,
125
+ 18956,
126
+ 20075,
127
+ 21675,
128
+ 22520,
129
+ 26130,
130
+ 26161,
131
+ 26435,
132
+ 28279,
133
+ 29464,
134
+ 31650,
135
+ 32302,
136
+ 32470,
137
+ 36865,
138
+ 42863,
139
+ 47425,
140
+ 49870,
141
+ 50254,
142
+ 50258,
143
+ 50358,
144
+ 50359,
145
+ 50360,
146
+ 50361,
147
+ 50362
148
+ ],
149
  "torch_dtype": "float32",
150
  "transformers_version": "4.35.2",
151
+ "use_cache": false,
152
  "use_weighted_layer_sum": false,
153
  "vocab_size": 51865
154
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8f18415ab339cdd4698ee0b660d97a4bbb6f4cca8b341772fd7381753100d9a8
3
  size 151061672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54949258c437ee373da926ac04154414455d0d4c8161f0d20c82828c20a423b5
3
  size 151061672
runs/Nov28_09-23-37_icdcub-03/events.out.tfevents.1701163436.icdcub-03 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:934c9fcd9cf58a86b3a89a06c7165c5306c93c910a870f5a31ca08bde8e538d2
3
+ size 5956
runs/Nov28_10-19-33_icdcub-03/events.out.tfevents.1701166775.icdcub-03 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6bd47b8d20a784d2b149c8d819f95647374ed068c75ffbadf5b64351ac63d96
3
+ size 5956
runs/Nov28_10-23-32_icdcub-03/events.out.tfevents.1701167013.icdcub-03 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4247a34d12da42733abdadc57ca7ba0886d95a2618979a80e01f41a9cbf3641
3
+ size 5956
runs/Nov28_10-27-02_icdcub-03/events.out.tfevents.1701167224.icdcub-03 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:716bc42615079d14bb66e02ed7746278f0bbb571ed5eb5fbd88ec0c73438e893
3
+ size 6304
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ea6c6158294e02ed53b0bd13afadcb1ae65fa6bb7321698a2c59266435b85e64
3
  size 4283
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c40a0d185694cc56c2fc9fdd331de68ac9ab8b26f410400080e9347dee3b02fa
3
  size 4283