unknown committed on
Commit
2a8a17a
1 Parent(s): ad7ebad

Coqui stt model for large Arabic vocabulary

Browse files
LICENCE.txt ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ MIT License
2
+
3
+ Copyright (c) 2021 Anas Hasni
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining a copy
6
+ of this software and associated documentation files (the "Software"), to deal
7
+ in the Software without restriction, including without limitation the rights
8
+ to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9
+ copies of the Software, and to permit persons to whom the Software is
10
+ furnished to do so, subject to the following conditions:
11
+
12
+ The above copyright notice and this permission notice shall be included in all
13
+ copies or substantial portions of the Software.
14
+
15
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
+ IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
+ FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18
+ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
+ LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20
+ OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21
+ SOFTWARE.
README.md.txt ADDED
File without changes
alphabet.txt ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ ء
3
+ ؤ
4
+ ا
5
+ ب
6
+ ة
7
+ ت
8
+ ث
9
+ ج
10
+ ح
11
+ خ
12
+ د
13
+ ذ
14
+ ر
15
+ ز
16
+ س
17
+ ش
18
+ ص
19
+ ض
20
+ ط
21
+ ظ
22
+ ع
23
+ غ
24
+ ف
25
+ ق
26
+ ك
27
+ ل
28
+ م
29
+ ن
30
+ ه
31
+ و
32
+ ى
33
+ ي
34
+ ٓ
35
+ ٔ
36
+ ی
best_dev-25350.data-00000-of-00001 ADDED
Binary file (10.3 MB). View file
 
best_dev-25350.index ADDED
Binary file (1.47 kB). View file
 
best_dev-25350.meta ADDED
Binary file (1.26 MB). View file
 
best_dev_checkpoint ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ model_checkpoint_path: "best_dev-25350"
2
+ all_model_checkpoint_paths: "best_dev-25350"
flags.txt ADDED
@@ -0,0 +1,98 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "train_files": [
3
+ "ar-train-dev/train.csv"
4
+ ],
5
+ "dev_files": [
6
+ "ar-train-dev/dev.csv"
7
+ ],
8
+ "test_files": [],
9
+ "metrics_files": [],
10
+ "read_buffer": 1048576,
11
+ "feature_cache": "",
12
+ "cache_for_epochs": 0,
13
+ "feature_win_len": 32,
14
+ "feature_win_step": 20,
15
+ "audio_sample_rate": 16000,
16
+ "normalize_sample_rate": true,
17
+ "augment": null,
18
+ "epochs": 20,
19
+ "dropout_rate": 0.05,
20
+ "dropout_rate2": 0.05,
21
+ "dropout_rate3": 0.05,
22
+ "dropout_rate4": 0.0,
23
+ "dropout_rate5": 0.0,
24
+ "dropout_rate6": 0.05,
25
+ "relu_clip": 20.0,
26
+ "beta1": 0.9,
27
+ "beta2": 0.999,
28
+ "epsilon": 1e-08,
29
+ "learning_rate": 0.001,
30
+ "train_batch_size": 16,
31
+ "dev_batch_size": 16,
32
+ "test_batch_size": 1,
33
+ "export_batch_size": 1,
34
+ "inter_op_parallelism_threads": 0,
35
+ "intra_op_parallelism_threads": 0,
36
+ "use_allow_growth": false,
37
+ "load_cudnn": false,
38
+ "train_cudnn": false,
39
+ "automatic_mixed_precision": false,
40
+ "limit_train": 0,
41
+ "limit_dev": 0,
42
+ "limit_test": 0,
43
+ "reverse_train": false,
44
+ "reverse_dev": false,
45
+ "reverse_test": false,
46
+ "checkpoint_dir": "",
47
+ "load_checkpoint_dir": "/workspace/.local/share/stt/checkpoints",
48
+ "save_checkpoint_dir": "checkpoints_arabic",
49
+ "checkpoint_secs": 600,
50
+ "max_to_keep": 5,
51
+ "load_train": "init",
52
+ "load_evaluate": "auto",
53
+ "drop_source_layers": 0,
54
+ "export_dir": "",
55
+ "remove_export": false,
56
+ "export_tflite": false,
57
+ "n_steps": 16,
58
+ "export_zip": false,
59
+ "export_file_name": "output_graph",
60
+ "export_beam_width": 500,
61
+ "export_author_id": "author",
62
+ "export_model_name": "model",
63
+ "export_model_version": "0.0.1",
64
+ "export_contact_info": "<public contact information of the author. Can be an email address, or a link to a contact form, issue tracker, or discussion forum. Must provide a way to reach the model authors>",
65
+ "export_license": "<SPDX identifier of the license of the exported model. See https://spdx.org/licenses/. If the license does not have an SPDX identifier, use the license name.>",
66
+ "export_language": "<language the model was trained on - IETF BCP 47 language tag including at least language, script and region subtags. E.g. \"en-Latn-UK\" or \"de-Latn-DE\" or \"cmn-Hans-CN\". Include as much info as you can without loss of precision. For example, if a model is trained on Scottish English, include the variant subtag: \"en-Latn-GB-Scotland\".>",
67
+ "export_min_stt_version": "<minimum Coqui STT version (inclusive) the exported model is compatible with>",
68
+ "export_max_stt_version": "<maximum Coqui STT version (inclusive) the exported model is compatible with>",
69
+ "export_description": "<Freeform description of the model being exported. Markdown accepted. You can also leave this flag unchanged and edit the generated .md file directly. Useful things to describe are demographic and acoustic characteristics of the data used to train the model, any architectural changes, names of public datasets that were used when applicable, hyperparameters used for training, evaluation results on standard benchmark datasets, etc.>",
70
+ "log_level": 1,
71
+ "show_progressbar": true,
72
+ "log_placement": false,
73
+ "report_count": 5,
74
+ "summary_dir": "/workspace/.local/share/stt/summaries",
75
+ "test_output_file": "",
76
+ "n_hidden": 256,
77
+ "layer_norm": false,
78
+ "random_seed": 4568,
79
+ "early_stop": false,
80
+ "es_epochs": 25,
81
+ "es_min_delta": 0.05,
82
+ "reduce_lr_on_plateau": false,
83
+ "plateau_epochs": 10,
84
+ "plateau_reduction": 0.1,
85
+ "force_initialize_learning_rate": false,
86
+ "bytes_output_mode": false,
87
+ "alphabet_config_path": "ar-train-dev/alphabet.txt",
88
+ "scorer_path": "",
89
+ "beam_width": 1024,
90
+ "lm_alpha": 0.931289039105002,
91
+ "lm_beta": 1.1834137581510284,
92
+ "cutoff_prob": 1.0,
93
+ "cutoff_top_n": 300,
94
+ "one_shot_infer": null,
95
+ "lm_alpha_max": 5,
96
+ "lm_beta_max": 5,
97
+ "n_trials": 2400
98
+ }