Upload folder using huggingface_hub

Browse files

Files changed (13) hide show

.gitattributes +0 -1
README.md +106 -0
added_tokens.json +4 -0
alphabet.json +1 -0
config.json +116 -0
language_model/5gram.bin +3 -0
language_model/attrs.json +1 -0
language_model/unigrams.txt +852 -0
preprocessor_config.json +10 -0
pytorch_model.bin +3 -0
special_tokens_map.json +148 -0
tokenizer_config.json +15 -0
vocab.json +98 -0

.gitattributes CHANGED Viewed

@@ -25,7 +25,6 @@
 *.safetensors filter=lfs diff=lfs merge=lfs -text
 saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.tar.* filter=lfs diff=lfs merge=lfs -text
-*.tar filter=lfs diff=lfs merge=lfs -text
 *.tflite filter=lfs diff=lfs merge=lfs -text
 *.tgz filter=lfs diff=lfs merge=lfs -text
 *.wasm filter=lfs diff=lfs merge=lfs -text

 *.safetensors filter=lfs diff=lfs merge=lfs -text
 saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.tar.* filter=lfs diff=lfs merge=lfs -text
 *.tflite filter=lfs diff=lfs merge=lfs -text
 *.tgz filter=lfs diff=lfs merge=lfs -text
 *.wasm filter=lfs diff=lfs merge=lfs -text

README.md ADDED Viewed

	@@ -0,0 +1,106 @@

+---
+language: vi
+datasets:
+- youtube-vi-13k-hours
+tags:
+- speech
+license: cc-by-nc-4.0
+---
+# Vietnamese Self-Supervised Learning Wav2Vec2 model
+## Model
+We use the wav2vec2 architecture for self-supervised learning.
+<img src="https://raw.githubusercontent.com/patrickvonplaten/scientific_images/master/wav2vec2.png" width=75% height=75%>
+## Data
+Our self-supervised model is pre-trained on a massive audio dataset of 13k hours of Vietnamese YouTube audio, which includes:
+  - Clean audio
+  - Noisy audio
+  - Conversation
+  - Multi-gender and dialects
+## Download
+We have already uploaded our pre-trained models to Hugging Face. The base model was trained for 35 epochs and the large model for 20 epochs, in about 30 days using a TPU V3-8.
+ - [Base version](https://huggingface.co/nguyenvulebinh/wav2vec2-base-vi) ~ 95M params
+ - [Large version](https://huggingface.co/nguyenvulebinh/wav2vec2-large-vi) ~ 317M params
+## Usage
+```python
+from transformers import Wav2Vec2ForPreTraining, Wav2Vec2Processor
+model_name = 'nguyenvulebinh/wav2vec2-base-vi'
+# model_name = 'nguyenvulebinh/wav2vec2-large-vi'
+model = Wav2Vec2ForPreTraining.from_pretrained(model_name)
+processor = Wav2Vec2Processor.from_pretrained(model_name)
+```
+Since our model has the same architecture as the English wav2vec2 version, you can use [this notebook](https://colab.research.google.com/drive/1FjTsqbYKphl9kL-eILgUc-bl4zVThL8F?usp=sharing) for more information on how to fine-tune the model.
+## Finetuned version
+### VLSP 2020 ASR dataset
+Benchmark WER results on the VLSP T1 test set:
+| | [base model](https://huggingface.co/nguyenvulebinh/wav2vec2-base-vi-vlsp2020) | [large model](https://huggingface.co/nguyenvulebinh/wav2vec2-large-vi-vlsp2020) |
+|---|---|---|
+|without LM| 8.66  | 6.90 |
+|with 5-gram LM| 6.53 | 5.32 |
+Usage
+```python
+#pytorch
+#!pip install transformers==4.20.0
+#!pip install https://github.com/kpu/kenlm/archive/master.zip
+#!pip install pyctcdecode==0.4.0
+from transformers.file_utils import cached_path, hf_bucket_url
+from importlib.machinery import SourceFileLoader
+from transformers import Wav2Vec2ProcessorWithLM
+from IPython.lib.display import Audio
+import torchaudio
+import torch
+# Load model & processor
+model_name = "nguyenvulebinh/wav2vec2-base-vi-vlsp2020"
+# model_name = "nguyenvulebinh/wav2vec2-large-vi-vlsp2020"
+model = SourceFileLoader("model", cached_path(hf_bucket_url(model_name,filename="model_handling.py"))).load_module().Wav2Vec2ForCTC.from_pretrained(model_name)
+processor = Wav2Vec2ProcessorWithLM.from_pretrained(model_name)
+# Load an example audio (16k)
+audio, sample_rate = torchaudio.load(cached_path(hf_bucket_url(model_name, filename="t2_0000006682.wav")))
+input_data = processor.feature_extractor(audio[0], sampling_rate=16000, return_tensors='pt')
+# Infer
+output = model(**input_data)
+# Output transcript without LM
+print(processor.tokenizer.decode(output.logits.argmax(dim=-1)[0].detach().cpu().numpy()))
+# Output transcript with LM
+print(processor.decode(output.logits.cpu().detach().numpy()[0], beam_width=100).text)
+```
+## Acknowledgment
+- We would like to thank the Google TPU Research Cloud (TRC) program and Soonson Kwon (Google ML Ecosystem programs Lead) for their support.
+- Special thanks to my colleagues at [VietAI](https://vietai.org/) and [VAIS](https://vais.vn/) for their advice.
+## Contact
+nguyenvulebinh@gmail.com / binh@vietai.org
+[![Follow](https://img.shields.io/twitter/follow/nguyenvulebinh?style=social)](https://twitter.com/intent/follow?screen_name=nguyenvulebinh)

added_tokens.json ADDED Viewed

	@@ -0,0 +1,4 @@

+{
+  "</s>": 97,
+  "<s>": 96
+}

alphabet.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"labels": [" ", "a", "b", "c", "d", "e", "f", "g", "h", "i", "j", "k", "l", "m", "n", "o", "p", "q", "r", "s", "t", "u", "v", "w", "x", "y", "z", "\u00e0", "\u00e1", "\u00e2", "\u00e3", "\u00e8", "\u00e9", "\u00ea", "\u00ec", "\u00ed", "\u00f2", "\u00f3", "\u00f4", "\u00f5", "\u00f9", "\u00fa", "\u00fd", "\u0103", "\u0111", "\u0129", "\u0169", "\u01a1", "\u01b0", "\u1ea1", "\u1ea3", "\u1ea5", "\u1ea7", "\u1ea9", "\u1eab", "\u1ead", "\u1eaf", "\u1eb1", "\u1eb3", "\u1eb5", "\u1eb7", "\u1eb9", "\u1ebb", "\u1ebd", "\u1ebf", "\u1ec1", "\u1ec3", "\u1ec5", "\u1ec7", "\u1ec9", "\u1ecb", "\u1ecd", "\u1ecf", "\u1ed1", "\u1ed3", "\u1ed5", "\u1ed7", "\u1ed9", "\u1edb", "\u1edd", "\u1edf", "\u1ee1", "\u1ee3", "\u1ee5", "\u1ee7", "\u1ee9", "\u1eeb", "\u1eed", "\u1eef", "\u1ef1", "\u1ef3", "\u1ef5", "\u1ef7", "\u1ef9", "\u2047", "", "<s>", "</s>"], "is_bpe": false}

config.json ADDED Viewed

	@@ -0,0 +1,116 @@

+{
+  "_name_or_path": "./model-bin/wav2vec_pretrained/large/",
+  "activation_dropout": 0.0,
+  "adapter_kernel_size": 3,
+  "adapter_stride": 2,
+  "add_adapter": false,
+  "apply_spec_augment": true,
+  "architectures": [
+    "Wav2Vec2ForPreTraining"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "codevector_dim": 768,
+  "contrastive_logits_temperature": 0.1,
+  "conv_bias": true,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "diversity_loss_weight": 0.1,
+  "do_stable_layer_norm": true,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_dropout": 0.0,
+  "feat_extract_norm": "layer",
+  "feat_proj_dropout": 0.1,
+  "feat_quantizer_dropout": 0.0,
+  "final_dropout": 0.0,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 1024,
+  "initializer_range": 0.02,
+  "intermediate_size": 4096,
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.1,
+  "mask_channel_length": 10,
+  "mask_channel_min_space": 1,
+  "mask_channel_other": 0.0,
+  "mask_channel_prob": 0.0,
+  "mask_channel_selection": "static",
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_min_space": 1,
+  "mask_time_other": 0.0,
+  "mask_time_prob": 0.075,
+  "mask_time_selection": "static",
+  "model_type": "wav2vec2",
+  "num_adapter_layers": 3,
+  "num_attention_heads": 16,
+  "num_codevector_groups": 2,
+  "num_codevectors_per_group": 320,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 24,
+  "num_negatives": 100,
+  "output_hidden_size": 1024,
+  "pad_token_id": 0,
+  "proj_codevector_dim": 768,
+  "tdnn_dilation": [
+    1,
+    2,
+    3,
+    1,
+    1
+  ],
+  "tdnn_dim": [
+    512,
+    512,
+    512,
+    512,
+    1500
+  ],
+  "tdnn_kernel": [
+    5,
+    3,
+    3,
+    1,
+    1
+  ],
+  "torch_dtype": "float32",
+  "transformers_version": "4.23.1",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 96,
+  "xvector_output_dim": 512
+}

language_model/5gram.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dd50eff6ccdeedf6f5672c824cd9c8ca3775a16d7e04962ae464fc56db656c2a
+size 2906312

language_model/attrs.json ADDED Viewed

	@@ -0,0 +1 @@


+ {"alpha": 0.5, "beta": 1.5, "unk_score_offset": -10.0, "score_boundary": true}

language_model/unigrams.txt ADDED Viewed

	@@ -0,0 +1,852 @@

+/21
+/47
+/giảm
+/hè
+0
+1
+10
+11
+12
+13
+14
+15
+16
+17
+18
+19
+2
+20
+21
+22
+23
+24
+25
+26
+27
+28
+29
+3
+30
+31
+32
+33
+34
+35
+36
+37
+38
+39
+4
+40
+41
+42
+43
+44
+45
+46
+47
+48
+49
+5
+50
+51
+52
+53
+54
+55
+56
+57
+58
+59
+6
+61
+62
+64
+65
+66
+7
+71
+72
+73
+74
+76
+77
+78
+8
+82
+83
+84
+85
+87
+88
+89
+9
+92
+95
+96
+97
+99
+</s>
+<s>
+a
+ai
+alo
+anh
+ayo
+ban
+bao
+biết
+buồn
+buổi
+bà
+bài
+bàn
+bách
+bánh
+báo
+bát
+bây
+bè
+bé
+béng
+bên
+bình
+bí
+bóng
+bạn
+bảo
+bẩn
+bận
+bật
+bắn
+bắt
+bếp
+bể
+bị
+bọn
+bỏ
+bố
+bồn
+bớt
+bởi
+bụi
+bữa
+c
+ca
+cafe
+camera
+chiếc
+chiếu
+chiều
+cho
+choạng
+chung
+chuyện
+chuẩn
+chà
+chào
+chán
+cháu
+cháy
+chín
+chính
+chói
+chùm
+chú
+chúng
+chút
+chơi
+chưa
+chạy
+chả
+chảy
+chậm
+chập
+chậu
+chắc
+chẳng
+chế
+chết
+chỉ
+chị
+chịu
+chồng
+chỗ
+chờ
+chờn
+chủ
+chứ
+chức
+chứng
+coi
+compact
+con
+cu
+cuối
+cuốn
+cuộc
+cài
+cá
+các
+cái
+cánh
+cáo
+cây
+còn
+có
+cô
+công
+cúng
+cũng
+cơ
+cơm
+cường
+cạnh
+cả
+cảm
+cảnh
+cất
+cần
+cầu
+cẩn
+cậu
+cổng
+cỡ
+của
+cứ
+cửa
+da
+do
+duy
+dõi
+dùm
+dùng
+dưng
+dướ
+dưới
+dược
+dạo
+dần
+dậy
+dẹp
+dến
+dễ
+dọn
+dở
+dụng
+e
+em
+eo
+fax
+game
+garage
+ghê
+gia
+giai
+gian
+giá
+giãn
+gió
+giùm
+giúp
+giảm
+giản
+giặt
+giờ
+giời
+giữ
+gym
+gà
+gác
+gái
+gì
+góc
+gúp
+gấp
+gần
+gặp
+haizz
+hanh
+hay
+hey
+hiên
+hình
+hiểu
+hiện
+hoa
+hoang
+hom
+hoà
+hoàng
+hoạt
+huy
+huỳnh
+huỷ
+hà
+hành
+hát
+hân
+hãng
+hãy
+hè
+héo
+hình
+hòa
+hóng
+hôi
+hôm
+hôn
+hộ
+hú
+hút
+hơi
+hơn
+hư
+hầm
+hắt
+hẳn
+hẵng
+hẹn
+hết
+họ
+học
+họp
+hỏng
+hồ
+hồng
+hỗ
+hộ
+hủy
+in
+karaoke
+kem
+khi
+khoàng
+khoảng
+khuya
+khá
+khách
+khét
+khí
+khó
+khói
+khô
+khôi
+không
+khả
+khắp
+khỏi
+kia
+kinh
+kiểm
+kiệm
+ko
+kéo
+kêu
+kìa
+kĩ
+kẹt
+kết
+kịch
+kịp
+lang
+laptop
+lau
+led
+len
+linh
+liệu
+loa
+long
+luôn
+là
+làm
+láng
+lát
+lâu
+lãng
+lên
+lênh
+lí
+lò
+lô
+lùa
+lùi
+lúc
+lý
+lưng
+lượng
+lạ
+lại
+lạnh
+lấy
+lập
+lắm
+lặng
+lịch
+lỗi
+lức
+mau
+minh
+miếng
+mua
+muốn
+muỗi
+muộn
+my
+mà
+màn
+mành
+màu
+mày
+mát
+máy
+mãi
+mình
+mính
+mùa
+mùi
+mưa
+mạn
+mạnh
+mất
+mấy
+mắt
+mặt
+mẹ
+mến
+mệt
+mọi
+mỏi
+một
+mới
+mờ
+mời
+mở
+mức
+nay
+ngay
+nghe
+nghi
+nghĩ
+nghơi
+nghỉ
+ngon
+ngoài
+ngày
+ngã
+ngôi
+ngơi
+người
+ngại
+ngạt
+ngập
+ngắt
+ngồi
+ngột
+ngủ
+nha
+nhanh
+nhà
+nhe
+nhi
+nhiên
+nhiều
+nhiệt
+nho
+nhà
+nhá
+nháp
+nhávào
+nháy
+nhân
+nhé
+nhìn
+nhòe
+nhó
+như
+nhưng
+nhạc
+nhảy
+nhấp
+nhập
+nhằng
+nhể
+nhỉ
+nhỏ
+nhớ
+nhớp
+nhờ
+nhở
+nhỡ
+nào
+này
+náy
+nãy
+nên
+nó
+nóng
+nôi
+nơi
+nước
+nướng
+nấc
+nấu
+nắng
+nặc
+nếu
+nối
+nồm
+nồng
+nổ
+nổi
+nội
+nửa
+nữ
+nữa
+nực
+oi
+ok
+okay
+oke
+okei
+om
+online
+pha
+phim
+phiền
+phát
+phía
+phòng
+phóng
+phút
+phải
+phỏng
+pin
+qua
+quang
+quay
+que
+quyết
+quá
+quân
+quên
+quạt
+quả
+quản
+quần
+ra
+radio
+riêng
+rè
+rèm
+rét
+ròi
+rõ
+rùi
+rượu
+rất
+rồi
+rời
+rủ
+rửa
+sa
+sai
+sang
+sao
+sau
+sen
+set
+sinh
+siri
+smarthome
+su
+suất
+suốt
+sàn
+sách
+sáng
+sân
+sóng
+sôi
+sư
+sưởi
+sạch
+sảnh
+sắp
+sẵn
+sẽ
+số
+sổ
+sớm
+sợ
+sợi
+sử
+sự
+ta
+tai
+tao
+tau
+tay
+thang
+thank
+thay
+theo
+thi
+thiết
+thiếu
+thiệt
+thoáng
+thu
+thui
+thành
+thân
+thèm
+thêm
+thì
+thôi
+thông
+thúc
+thăng
+thư
+thượng
+thả
+thấp
+thấy
+thật
+thắng
+thằng
+thế
+thể
+thịt
+thống
+thờ
+thời
+thức
+thử
+ti
+tin
+tiếng
+tiếp
+tiết
+tiền
+tiệc
+to
+toang
+toàn
+toé
+tra
+tranh
+treo
+trogn
+trong
+trung
+truyền
+tràn
+trái
+tráng
+trên
+trì
+tròn
+tròng
+trông
+trưa
+trưng
+trước
+trường
+trạng
+trầm
+trần
+trặc
+trặng
+trẻ
+trị
+trọ
+trộm
+trời
+trợ
+trụ
+trục
+trực
+tung
+tuyệt
+tuýp
+tài
+tâm
+tên
+tìm
+tình
+tí
+tính
+tôi
+tùng
+tý
+tăng
+tĩnh
+tư
+tưới
+tường
+tại
+tất
+tầm
+tầng
+tập
+tắm
+tắt
+tẹo
+tỉnh
+tốc
+tối
+tốn
+tốt
+tổ
+tớ
+tới
+tủ
+tức
+từ
+tự
+ui
+up
+uây
+uống
+van
+vi
+việc
+viện
+vui
+vy
+và
+vài
+vào
+ván
+vãi
+vì
+vòi
+vòng
+vô
+với
+vườn
+vấn
+vẫn
+vậy
+vắng
+vẻ
+về
+vệ
+vội
+với
+vời
+vợ
+vừa
+wc
+xa
+xe
+xem
+xin
+xong
+xuân
+xuống
+xài
+xách
+xép
+xíu
+xông
+xả
+xảy
+xịt
+you
+yên
+yêu
+yếu
+zai
+à
+ào
+á
+ánh
+áo
+áp
+âm
+ây
+ê
+í
+ít
+ô
+ôi
+ông
+ý
+ăn
+đang
+đau
+đi
+điên
+điều
+điện
+đâu
+đây
+đã
+đèn
+đê
+đêm
+đình
+đó
+đón
+đóng
+đông
+đúng
+đũa
+đơn
+đường
+được
+đại
+đạt
+đất
+đấy
+đầu
+đầy
+đắng
+đặt
+đẹp
+đến
+đề
+đền
+để
+định
+đọc
+đống
+đốt
+đồ
+đồng
+độ
+động
+đỡ
+đợi
+đủ
+đứa
+đứng
+đừng
+ơ
+ơi
+ơigiảm
+ơitắt
+ơn
+ưi
+ướt
+ạ
+ảnh
+ảo
+ấm
+ấy
+ẩm
+ế
+ề
+ốp
+ồn
+ổn
+ớ
+ới
+ờ
+ờm
+ở
+ủi
+ừm

preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,10 @@

+{
+  "do_normalize": true,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0.0,
+  "processor_class": "Wav2Vec2ProcessorWithLM",
+  "return_attention_mask": true,
+  "sampling_rate": 16000
+}

pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a7936feb834fdea55f0968b2235bd9fd7367a0f954e412a6a8205be803943a89
+size 1269701863

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,148 @@

+{
+  "additional_special_tokens": [
+    {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false
+    }
+  ],
+  "bos_token": "<s>",
+  "eos_token": "</s>",
+  "pad_token": "<pad>",
+  "unk_token": "<unk>"
+}

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "bos_token": "<s>",
+  "clean_up_tokenization_spaces": true,
+  "do_lower_case": false,
+  "eos_token": "</s>",
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": "<pad>",
+  "processor_class": "Wav2Vec2ProcessorWithLM",
+  "replace_word_delimiter_char": " ",
+  "target_lang": null,
+  "tokenizer_class": "Wav2Vec2CTCTokenizer",
+  "tokenizer_file": null,
+  "unk_token": "<unk>",
+  "word_delimiter_token": "|"
+}

vocab.json ADDED Viewed

	@@ -0,0 +1,98 @@

+{
+  "<pad>": 95,
+  "<unk>": 94,
+  "a": 1,
+  "b": 2,
+  "c": 3,
+  "d": 4,
+  "e": 5,
+  "f": 6,
+  "g": 7,
+  "h": 8,
+  "i": 9,
+  "j": 10,
+  "k": 11,
+  "l": 12,
+  "m": 13,
+  "n": 14,
+  "o": 15,
+  "p": 16,
+  "q": 17,
+  "r": 18,
+  "s": 19,
+  "t": 20,
+  "u": 21,
+  "v": 22,
+  "w": 23,
+  "x": 24,
+  "y": 25,
+  "z": 26,
+  "|": 0,
+  "à": 27,
+  "á": 28,
+  "â": 29,
+  "ã": 30,
+  "è": 31,
+  "é": 32,
+  "ê": 33,
+  "ì": 34,
+  "í": 35,
+  "ò": 36,
+  "ó": 37,
+  "ô": 38,
+  "õ": 39,
+  "ù": 40,
+  "ú": 41,
+  "ý": 42,
+  "ă": 43,
+  "đ": 44,
+  "ĩ": 45,
+  "ũ": 46,
+  "ơ": 47,
+  "ư": 48,
+  "ạ": 49,
+  "ả": 50,
+  "ấ": 51,
+  "ầ": 52,
+  "ẩ": 53,
+  "ẫ": 54,
+  "ậ": 55,
+  "ắ": 56,
+  "ằ": 57,
+  "ẳ": 58,
+  "ẵ": 59,
+  "ặ": 60,
+  "ẹ": 61,
+  "ẻ": 62,
+  "ẽ": 63,
+  "ế": 64,
+  "ề": 65,
+  "ể": 66,
+  "ễ": 67,
+  "ệ": 68,
+  "ỉ": 69,
+  "ị": 70,
+  "ọ": 71,
+  "ỏ": 72,
+  "ố": 73,
+  "ồ": 74,
+  "ổ": 75,
+  "ỗ": 76,
+  "ộ": 77,
+  "ớ": 78,
+  "ờ": 79,
+  "ở": 80,
+  "ỡ": 81,
+  "ợ": 82,
+  "ụ": 83,
+  "ủ": 84,
+  "ứ": 85,
+  "ừ": 86,
+  "ử": 87,
+  "ữ": 88,
+  "ự": 89,
+  "ỳ": 90,
+  "ỵ": 91,
+  "ỷ": 92,
+  "ỹ": 93
+}