add tokenizer
Browse files
runs/Nov05_09-17-33_29f01e962d6c/1636103870.8574052/events.out.tfevents.1636103870.29f01e962d6c.78.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fa1f2f8e07eaa5d39a334784067356b34643adb463a0b938172d2a84c2c43aaf
|
3 |
+
size 4576
|
runs/Nov05_09-17-33_29f01e962d6c/events.out.tfevents.1636103870.29f01e962d6c.78.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c557d8dd07751bf8f685557c97c10ed1b1fde5de78dea2b0a7728acb5205580b
|
3 |
+
size 4476
|
vocab.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"
|
|
|
1 |
+
{"أ": 0, "ب": 1, "ظ": 2, "ث": 3, "ذ": 4, "؟": 5, "ي": 6, "ّ": 7, "ئ": 8, "،": 9, "ل": 10, "ز": 11, "ة": 12, "ح": 13, "ع": 14, "ض": 15, "ج": 16, "ن": 17, "َ": 18, "ق": 19, "ش": 20, "ص": 21, "ه": 22, "ر": 23, "إ": 24, "د": 25, "ت": 26, "خ": 27, "ً": 29, "ك": 30, "ؤ": 31, "م": 32, "ِ": 33, "ٍ": 34, "ء": 35, "ٌ": 36, "و": 37, "س": 38, "ُ": 39, "آ": 40, "ا": 41, "ط": 42, "ى": 43, "ف": 44, "ْ": 45, "غ": 46, "|": 28, "[UNK]": 47, "[PAD]": 48}
|