Update README.md
Browse files
README.md
CHANGED
@@ -17,6 +17,36 @@ This modelcard aims to be a base template for new models. It has been generated
|
|
17 |
|
18 |
<!-- Provide a longer summary of what this model is. -->
|
19 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
20 |
|
21 |
|
22 |
- **Developed by:** [More Information Needed]
|
|
|
17 |
|
18 |
<!-- Provide a longer summary of what this model is. -->
|
19 |
|
20 |
+
```
|
21 |
+
class WhisperCTC(nn.Module):
|
22 |
+
def __init__(
|
23 |
+
self,
|
24 |
+
encoder_id: str = "tuanio/whisper-encoder.tiny.en",
|
25 |
+
dropout: float = 0.1,
|
26 |
+
vocab_size: int = 47,
|
27 |
+
):
|
28 |
+
super().__init__()
|
29 |
+
self.encoder = WhisperEncoder.from_pretrained(encoder_id)
|
30 |
+
print("Freezing Whisper Encoder...")
|
31 |
+
self.encoder._freeze_parameters()
|
32 |
+
print("Freezed!")
|
33 |
+
self.lm_head = nn.Sequential(
|
34 |
+
nn.SiLU(),
|
35 |
+
nn.Dropout(dropout),
|
36 |
+
nn.Linear(self.encoder.config.d_model, vocab_size),
|
37 |
+
)
|
38 |
+
nn.init.kaiming_uniform_(
|
39 |
+
self.lm_head[-1].weight, mode="fan_in", nonlinearity="relu"
|
40 |
+
)
|
41 |
+
|
42 |
+
def forward(self, feat: Tensor, attn_mask: Tensor):
|
43 |
+
enc = self.encoder(
|
44 |
+
input_features=feat, attention_mask=attn_mask
|
45 |
+
).last_hidden_state
|
46 |
+
logits = self.lm_head(enc)
|
47 |
+
log_probs = nn.functional.log_softmax(logits, dim=-1)
|
48 |
+
return log_probs
|
49 |
+
```
|
50 |
|
51 |
|
52 |
- **Developed by:** [More Information Needed]
|