patrickvonplaten committed on
Commit
7a2589d
1 Parent(s): 056dbd7
Files changed (2) hide show
  1. config.json +1 -12
  2. preprocessor_config.json +9 -0
config.json CHANGED
@@ -1,6 +1,5 @@
1
  {
2
  "activation_dropout": 0.0,
3
- "apply_spec_augment": true,
4
  "architectures": [
5
  "UniSpeechForPreTraining"
6
  ],
@@ -8,7 +7,6 @@
8
  "bos_token_id": 1,
9
  "classifier_proj_size": 256,
10
  "codevector_dim": 768,
11
- "contrastive_logits_temperature": 0.1,
12
  "conv_bias": true,
13
  "conv_dim": [
14
  512,
@@ -37,9 +35,6 @@
37
  2,
38
  2
39
  ],
40
- "ctc_loss_reduction": "sum",
41
- "ctc_zero_infinity": false,
42
- "diversity_loss_weight": 0.1,
43
  "do_stable_layer_norm": true,
44
  "eos_token_id": 2,
45
  "feat_extract_activation": "gelu",
@@ -48,7 +43,6 @@
48
  "feat_proj_dropout": 0.1,
49
  "feat_quantizer_dropout": 0.0,
50
  "final_dropout": 0.0,
51
- "gradient_checkpointing": false,
52
  "hidden_act": "gelu",
53
  "hidden_dropout": 0.1,
54
  "hidden_size": 1024,
@@ -57,17 +51,12 @@
57
  "layer_norm_eps": 1e-05,
58
  "layerdrop": 0.1,
59
  "mask_channel_length": 10,
60
- "mask_channel_min_space": 1,
61
- "mask_channel_other": 0.0,
62
  "mask_channel_prob": 0.0,
63
- "mask_channel_selection": "static",
64
  "mask_feature_length": 10,
65
  "mask_feature_prob": 0.0,
66
  "mask_time_length": 10,
67
  "mask_time_min_space": 1,
68
- "mask_time_other": 0.0,
69
  "mask_time_prob": 0.075,
70
- "mask_time_selection": "static",
71
  "model_type": "unispeech",
72
  "num_attention_heads": 16,
73
  "num_codevector_groups": 2,
@@ -84,5 +73,5 @@
84
  "torch_dtype": "float32",
85
  "transformers_version": "4.12.0.dev0",
86
  "use_weighted_layer_sum": false,
87
- "vocab_size": 32
88
  }
 
1
  {
2
  "activation_dropout": 0.0,
 
3
  "architectures": [
4
  "UniSpeechForPreTraining"
5
  ],
 
7
  "bos_token_id": 1,
8
  "classifier_proj_size": 256,
9
  "codevector_dim": 768,
 
10
  "conv_bias": true,
11
  "conv_dim": [
12
  512,
 
35
  2,
36
  2
37
  ],
 
 
 
38
  "do_stable_layer_norm": true,
39
  "eos_token_id": 2,
40
  "feat_extract_activation": "gelu",
 
43
  "feat_proj_dropout": 0.1,
44
  "feat_quantizer_dropout": 0.0,
45
  "final_dropout": 0.0,
 
46
  "hidden_act": "gelu",
47
  "hidden_dropout": 0.1,
48
  "hidden_size": 1024,
 
51
  "layer_norm_eps": 1e-05,
52
  "layerdrop": 0.1,
53
  "mask_channel_length": 10,
 
 
54
  "mask_channel_prob": 0.0,
 
55
  "mask_feature_length": 10,
56
  "mask_feature_prob": 0.0,
57
  "mask_time_length": 10,
58
  "mask_time_min_space": 1,
 
59
  "mask_time_prob": 0.075,
 
60
  "model_type": "unispeech",
61
  "num_attention_heads": 16,
62
  "num_codevector_groups": 2,
 
73
  "torch_dtype": "float32",
74
  "transformers_version": "4.12.0.dev0",
75
  "use_weighted_layer_sum": false,
76
+ "feature_extractor_type": "Wav2Vec2FeatureExtractor"
77
  }
preprocessor_config.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_normalize": true,
3
+ "feature_extractor_type": "Wav2Vec2FeatureExtractor",
4
+ "feature_size": 1,
5
+ "padding_side": "right",
6
+ "padding_value": 0,
7
+ "return_attention_mask": true,
8
+ "sampling_rate": 16000
9
+ }