deepdml committed
Commit 0047465
1 Parent(s): 82e55f0

Training in progress, step 5

added_tokens.json ADDED
@@ -0,0 +1 @@
+{"<s>": 51, "</s>": 52}
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:77656be03069b8daa203d5383c4936491871f7002ddf4732cd7d239ad24eef43
+oid sha256:b2c2b2e82339887ba6f01e7f784864f3ff7b65aeab8f30a9b10e2b6087512302
 size 143910
special_tokens_map.json ADDED
@@ -0,0 +1 @@
+{"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]", "additional_special_tokens": [{"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}]}
tokenizer_config.json ADDED
@@ -0,0 +1 @@
+{"unk_token": "[UNK]", "bos_token": "<s>", "eos_token": "</s>", "pad_token": "[PAD]", "do_lower_case": false, "word_delimiter_token": "|", "special_tokens_map_file": null, "tokenizer_file": null, "name_or_path": "./output/", "tokenizer_class": "Wav2Vec2CTCTokenizer"}
training_args.bin CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1f2f175d072062b719da3464b6fb6d166ba255f40e7adfec1b069e6d0c4b8aa4
+oid sha256:92e1628b89831b8faa1eeb20c5f236869a5cbe1a9325d410c940619f362c3462
 size 2991
vocab.json ADDED
@@ -0,0 +1 @@
+{"!": 1, ",": 2, "-": 3, ".": 4, ":": 5, ";": 6, "?": 7, "а": 8, "б": 9, "в": 10, "г": 11, "д": 12, "е": 13, "ж": 14, "з": 15, "и": 16, "к": 17, "л": 18, "м": 19, "н": 20, "о": 21, "п": 22, "р": 23, "с": 24, "т": 25, "у": 26, "ф": 27, "х": 28, "ц": 29, "ч": 30, "ш": 31, "ы": 32, "ь": 33, "џ": 34, "қ": 35, "ҟ": 36, "ҩ": 37, "ҭ": 38, "ҳ": 39, "ҵ": 40, "ҷ": 41, "ҽ": 42, "ҿ": 43, "ә": 44, "ӡ": 45, "ӷ": 46, "ԥ": 47, "–": 48, "|": 0, "[UNK]": 49, "[PAD]": 50}