add tokenizer
Browse files
.gitignore
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
checkpoint-*/
|
runs/Feb22_17-03-19_jake-a-01/1645545892.3068602/events.out.tfevents.1645545892.jake-a-01.68786.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f6650e419da33a5a0378f1a21effc282ea2f066d0530e2a29897e7f73712869
|
3 |
+
size 4498
|
runs/Feb22_17-03-19_jake-a-01/events.out.tfevents.1645545892.jake-a-01.68786.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a0077ffd7938ff715dd43449f2f3b0b6799105e9af50053a19b2589b0c5927b1
|
3 |
+
size 4407
|
vocab.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"
|
|
|
1 |
+
{"p": 0, "'": 1, "c": 2, "k": 3, "n": 4, "e": 5, "t": 6, "i": 7, "j": 8, "g": 9, "o": 10, "h": 11, "y": 12, "u": 13, "z": 15, "r": 16, "a": 17, "l": 18, "q": 19, "v": 20, "b": 21, "f": 22, "m": 23, "w": 24, "x": 25, "s": 26, "d": 27, "|": 14, "[UNK]": 28, "[PAD]": 29}
|