add tokenizer
Browse files
.gitignore
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
checkpoint-*/
|
runs/Dec19_07-13-10_d1bce08cd577/1639898068.3655849/events.out.tfevents.1639898068.d1bce08cd577.660.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f85395c66f6c49196af6ca9cf9662bba5224cd27600ef57561c521ae4224ce6
|
3 |
+
size 4537
|
runs/Dec19_07-13-10_d1bce08cd577/events.out.tfevents.1639898068.d1bce08cd577.660.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:186b9d79a315b0be33794ed85d31a886717be170f04cbc098fc797ebdd054ee8
|
3 |
+
size 4447
|
vocab.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"
|
|
|
1 |
+
{"v": 0, "j": 1, "'": 2, "y": 3, "k": 4, "w": 5, "n": 6, "x": 7, "r": 8, "a": 10, "b": 11, "e": 12, "t": 13, "p": 14, "f": 15, "o": 16, "d": 17, "g": 18, "q": 19, "c": 20, "m": 21, "h": 22, "s": 23, "l": 24, "u": 25, "z": 26, "i": 27, "|": 9, "[UNK]": 28, "[PAD]": 29}
|