Mahalakshmi committed on
Commit
ccbf2a9
1 Parent(s): adfe5f0

Update from Mahalakshmi

Browse files
.gitattributes CHANGED
@@ -25,3 +25,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
25
  *.zip filter=lfs diff=lfs merge=lfs -text
26
  *.zstandard filter=lfs diff=lfs merge=lfs -text
27
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
25
  *.zip filter=lfs diff=lfs merge=lfs -text
26
  *.zstandard filter=lfs diff=lfs merge=lfs -text
27
  *tfevents* filter=lfs diff=lfs merge=lfs -text
28
+ *.gitignore filter=lfs diff=lfs merge=lfs -text
29
+ *.json filter=lfs diff=lfs merge=lfs -text
30
+ *.arpa filter=lfs diff=lfs merge=lfs -text
31
+ *.txt filter=lfs diff=lfs merge=lfs -text
.gitignore CHANGED
@@ -1 +1,3 @@
1
- checkpoint-*/
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:750c10cd267eec2ff1b7afb10688e624b33cf558eef41ed63e00ef640e7fe38a
3
+ size 13
added_tokens.json CHANGED
@@ -1 +1,3 @@
1
- {"<s>": 52, "</s>": 53}
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43526c6b42b96e56b0bc000b25b394f29fbe53324d4a6b0ec479eed43ae63349
3
+ size 23
alphabet.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b2940b80d74250950dc253af7ecae795ea60a6a3c84558daa16e32879ef7bc5
3
+ size 548
config.json CHANGED
@@ -1,116 +1,3 @@
1
- {
2
- "_name_or_path": "facebook/wav2vec2-large-xlsr-53",
3
- "activation_dropout": 0.0,
4
- "adapter_kernel_size": 3,
5
- "adapter_stride": 2,
6
- "add_adapter": false,
7
- "apply_spec_augment": true,
8
- "architectures": [
9
- "Wav2Vec2ForCTC"
10
- ],
11
- "attention_dropout": 0.1,
12
- "bos_token_id": 1,
13
- "classifier_proj_size": 256,
14
- "codevector_dim": 768,
15
- "contrastive_logits_temperature": 0.1,
16
- "conv_bias": true,
17
- "conv_dim": [
18
- 512,
19
- 512,
20
- 512,
21
- 512,
22
- 512,
23
- 512,
24
- 512
25
- ],
26
- "conv_kernel": [
27
- 10,
28
- 3,
29
- 3,
30
- 3,
31
- 3,
32
- 2,
33
- 2
34
- ],
35
- "conv_stride": [
36
- 5,
37
- 2,
38
- 2,
39
- 2,
40
- 2,
41
- 2,
42
- 2
43
- ],
44
- "ctc_loss_reduction": "mean",
45
- "ctc_zero_infinity": false,
46
- "diversity_loss_weight": 0.1,
47
- "do_stable_layer_norm": true,
48
- "eos_token_id": 2,
49
- "feat_extract_activation": "gelu",
50
- "feat_extract_dropout": 0.0,
51
- "feat_extract_norm": "layer",
52
- "feat_proj_dropout": 0.0,
53
- "feat_quantizer_dropout": 0.0,
54
- "final_dropout": 0.0,
55
- "gradient_checkpointing": false,
56
- "hidden_act": "gelu",
57
- "hidden_dropout": 0.1,
58
- "hidden_size": 1024,
59
- "initializer_range": 0.02,
60
- "intermediate_size": 4096,
61
- "layer_norm_eps": 1e-05,
62
- "layerdrop": 0.1,
63
- "mask_channel_length": 10,
64
- "mask_channel_min_space": 1,
65
- "mask_channel_other": 0.0,
66
- "mask_channel_prob": 0.0,
67
- "mask_channel_selection": "static",
68
- "mask_feature_length": 10,
69
- "mask_feature_min_masks": 0,
70
- "mask_feature_prob": 0.0,
71
- "mask_time_length": 10,
72
- "mask_time_min_masks": 2,
73
- "mask_time_min_space": 1,
74
- "mask_time_other": 0.0,
75
- "mask_time_prob": 0.05,
76
- "mask_time_selection": "static",
77
- "model_type": "wav2vec2",
78
- "num_adapter_layers": 3,
79
- "num_attention_heads": 16,
80
- "num_codevector_groups": 2,
81
- "num_codevectors_per_group": 320,
82
- "num_conv_pos_embedding_groups": 16,
83
- "num_conv_pos_embeddings": 128,
84
- "num_feat_extract_layers": 7,
85
- "num_hidden_layers": 24,
86
- "num_negatives": 100,
87
- "output_hidden_size": 1024,
88
- "pad_token_id": 51,
89
- "proj_codevector_dim": 768,
90
- "tdnn_dilation": [
91
- 1,
92
- 2,
93
- 3,
94
- 1,
95
- 1
96
- ],
97
- "tdnn_dim": [
98
- 512,
99
- 512,
100
- 512,
101
- 512,
102
- 1500
103
- ],
104
- "tdnn_kernel": [
105
- 5,
106
- 3,
107
- 3,
108
- 1,
109
- 1
110
- ],
111
- "torch_dtype": "float32",
112
- "transformers_version": "4.17.0.dev0",
113
- "use_weighted_layer_sum": false,
114
- "vocab_size": 54,
115
- "xvector_output_dim": 512
116
- }
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8ede69bd2d13380480b53a8b3d13370a61081e3572b960f3135465e7e94659a
3
+ size 2314
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
language_model/5gram_correct.arpa ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b0c736f3e71c78722b9ba866e8255156f6023b6138f653d03554403796d0886
3
+ size 247315725
language_model/attrs.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5ffd02e1ceef6517476e72ebe7997ddef7e92d27cb5a23d6695d64c4317d6ad
3
+ size 78
language_model/unigrams.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f39385fac9c06769ac7a6259e5f39c8011bc5ff2f9a7d53f33a3f472ac51436f
3
+ size 3420726
preprocessor_config.json CHANGED
@@ -1,8 +1,3 @@
1
- {
2
- "do_normalize": true,
3
- "feature_size": 1,
4
- "padding_side": "right",
5
- "padding_value": 0.0,
6
- "return_attention_mask": true,
7
- "sampling_rate": 16000
8
- }
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c594304e9d9832162bedd5345051df29e8daf458a845cbed58c6ede23ceeae3
3
+ size 262
 
 
 
 
 
special_tokens_map.json CHANGED
@@ -1 +1,3 @@
1
- {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]", "additional_special_tokens": [{"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}]}
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8d4108744f9b30c57365da221c760137c262a6ddfa4a71a9a68a561d7b842ee
3
+ size 502
tokenizer_config.json CHANGED
@@ -1 +1,3 @@
1
- {"unk_token": "[UNK]", "bos_token": "<s>", "eos_token": "</s>", "pad_token": "[PAD]", "do_lower_case": false, "word_delimiter_token": "|", "special_tokens_map_file": null, "tokenizer_file": null, "name_or_path": "./", "tokenizer_class": "Wav2Vec2CTCTokenizer"}
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82ffa4d0803a58aab0bb06b3cd4515c627058fb05d13d28e8091277be16de818
3
+ size 349
vocab.json CHANGED
@@ -1 +1,3 @@
1
- {"ீ": 0, "'": 1, "ு": 2, "த": 3, "ஞ": 4, "ி": 5, "ய": 6, "உ": 7, "ஒ": 8, "ை": 9, "ோ": 10, "ா": 11, "ஜ": 12, "ம": 13, "ஈ": 14, "ழ": 15, "ஏ": 16, "ல": 17, "ங": 18, "ள": 19, "ொ": 20, "ப": 21, "ஃ": 22, "ஆ": 23, "ூ": 24, "்": 25, "ௌ": 26, "ட": 27, "ஐ": 28, "அ": 29, "’": 30, "ெ": 31, "ற": 32, "ண": 33, "ச": 34, "வ": 35, "ஸ": 36, "ஔ": 37, "ன": 38, "ஷ": 39, "ஓ": 40, "ர": 41, "எ": 42, "ே": 44, "ஊ": 45, "ஹ": 46, "ந": 47, "இ": 48, "க": 49, "|": 43, "[UNK]": 50, "[PAD]": 51}
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92d593af25445e3129a95927e45c84f8d4414d9322e4472ffb84bcbd87b965f8
3
+ size 562