shljessie committed on
Commit
2195771
1 Parent(s): 867dd68

Training in progress, step 200

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "openai/whisper-base",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "apply_spec_augment": false,
@@ -13,17 +13,17 @@
13
  ],
14
  "bos_token_id": 50257,
15
  "classifier_proj_size": 256,
16
- "d_model": 512,
17
- "decoder_attention_heads": 8,
18
- "decoder_ffn_dim": 2048,
19
  "decoder_layerdrop": 0.0,
20
- "decoder_layers": 6,
21
  "decoder_start_token_id": 50258,
22
  "dropout": 0.0,
23
- "encoder_attention_heads": 8,
24
- "encoder_ffn_dim": 2048,
25
  "encoder_layerdrop": 0.0,
26
- "encoder_layers": 6,
27
  "eos_token_id": 50257,
28
  "forced_decoder_ids": [
29
  [
@@ -52,7 +52,7 @@
52
  "max_target_positions": 448,
53
  "median_filter_width": 7,
54
  "model_type": "whisper",
55
- "num_hidden_layers": 6,
56
  "num_mel_bins": 80,
57
  "pad_token_id": 50257,
58
  "scale_embedding": false,
@@ -140,8 +140,6 @@
140
  49870,
141
  50254,
142
  50258,
143
- 50358,
144
- 50359,
145
  50360,
146
  50361,
147
  50362
 
1
  {
2
+ "_name_or_path": "openai/whisper-small",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "apply_spec_augment": false,
 
13
  ],
14
  "bos_token_id": 50257,
15
  "classifier_proj_size": 256,
16
+ "d_model": 768,
17
+ "decoder_attention_heads": 12,
18
+ "decoder_ffn_dim": 3072,
19
  "decoder_layerdrop": 0.0,
20
+ "decoder_layers": 12,
21
  "decoder_start_token_id": 50258,
22
  "dropout": 0.0,
23
+ "encoder_attention_heads": 12,
24
+ "encoder_ffn_dim": 3072,
25
  "encoder_layerdrop": 0.0,
26
+ "encoder_layers": 12,
27
  "eos_token_id": 50257,
28
  "forced_decoder_ids": [
29
  [
 
52
  "max_target_positions": 448,
53
  "median_filter_width": 7,
54
  "model_type": "whisper",
55
+ "num_hidden_layers": 12,
56
  "num_mel_bins": 80,
57
  "pad_token_id": 50257,
58
  "scale_embedding": false,
 
140
  49870,
141
  50254,
142
  50258,
 
 
143
  50360,
144
  50361,
145
  50362
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e39de275a755ba6fdc0b1f3d570095534357626eacb352ae4960e15469e48f0c
3
- size 290403936
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:093323b0ab2336837151240e5c2bef7a48b98fd141e729719bb34d7587024023
3
+ size 966995080
runs/May28_01-49-27_bef95ffba252/events.out.tfevents.1716860972.bef95ffba252.256.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57cdaa777798c88c45f9f0775a4553c0cdcfc043ba7d62395def02b7086ec33a
3
+ size 7412
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c7b62c56acb012288c61605427e170f005aea6b88c92df1660d2b5bb7a0f7993
3
  size 5304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:518bc8e526a5535c846340f5c6af347aff9bf78b63b03e55e5c5fd85b6df2830
3
  size 5304