dkleczek commited on
Commit
c8060dc
1 Parent(s): 918d78a

fixes to tokenizer

Browse files
added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f73effd45f282fdecbce3d5bda192b346d1e2e5dc024d4493ff276656001a5b6
3
+ size 24
merges.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20832466756a988386123195ca6a4d1ecf92f0c1ff346872412fa54a8a2cb179
3
+ size 546522
special_tokens_map.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0b3c279b6ecdb71996a86ffb4d4ab94dfdb5df95f00bac9515688faef2ff5dd
3
+ size 90
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:930138efc524dd7154f660fdfeafeac042f92640b7bf43df7c97fdc12e42140a
3
- size 1535805
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5fbc311f419d79d43b03e4675c06f0006119fd550ed72f3159d411fc8f83a82
3
+ size 1535928
tokenizer_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85039a345c9cf46c6cdbb1789dd2b1885e0067c60ce8efa77c791f2aa467fa9b
3
+ size 208
vocab.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba07a419f1e025bb93d757d738e3af7853128053df7b880d4fb7ab851b646207
3
+ size 888217