ehristoforu committed on
Commit
a8e5e2a
1 Parent(s): 83e293e

Upload 5 files

Browse files
tokenizer_2/added_tokens.json ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ {
2
+ "!": 0,
3
+ "<|endoftext|>": 49407,
4
+ "<|startoftext|>": 49406
5
+ }
tokenizer_2/special_tokens_map.json CHANGED
@@ -1,24 +1,6 @@
1
  {
2
- "bos_token": {
3
- "content": "<|startoftext|>",
4
- "lstrip": false,
5
- "normalized": true,
6
- "rstrip": false,
7
- "single_word": false
8
- },
9
- "eos_token": {
10
- "content": "<|endoftext|>",
11
- "lstrip": false,
12
- "normalized": true,
13
- "rstrip": false,
14
- "single_word": false
15
- },
16
  "pad_token": "!",
17
- "unk_token": {
18
- "content": "<|endoftext|>",
19
- "lstrip": false,
20
- "normalized": true,
21
- "rstrip": false,
22
- "single_word": false
23
- }
24
  }
 
1
  {
2
+ "bos_token": "<|startoftext|>",
3
+ "eos_token": "<|endoftext|>",
 
 
 
 
 
 
 
 
 
 
 
 
4
  "pad_token": "!",
5
+ "unk_token": "<|endoftext|>"
 
 
 
 
 
 
6
  }
tokenizer_2/tokenizer_config.json CHANGED
@@ -15,17 +15,18 @@
15
  "normalized": true,
16
  "rstrip": false,
17
  "single_word": false,
18
- "special": true
19
  },
20
  "49407": {
21
  "content": "<|endoftext|>",
22
  "lstrip": false,
23
- "normalized": true,
24
  "rstrip": false,
25
  "single_word": false,
26
- "special": true
27
  }
28
  },
 
29
  "bos_token": "<|startoftext|>",
30
  "clean_up_tokenization_spaces": true,
31
  "do_lower_case": true,
@@ -34,5 +35,6 @@
34
  "model_max_length": 77,
35
  "pad_token": "!",
36
  "tokenizer_class": "CLIPTokenizer",
 
37
  "unk_token": "<|endoftext|>"
38
  }
 
15
  "normalized": true,
16
  "rstrip": false,
17
  "single_word": false,
18
+ "special": false
19
  },
20
  "49407": {
21
  "content": "<|endoftext|>",
22
  "lstrip": false,
23
+ "normalized": false,
24
  "rstrip": false,
25
  "single_word": false,
26
+ "special": false
27
  }
28
  },
29
+ "additional_special_tokens": [],
30
  "bos_token": "<|startoftext|>",
31
  "clean_up_tokenization_spaces": true,
32
  "do_lower_case": true,
 
35
  "model_max_length": 77,
36
  "pad_token": "!",
37
  "tokenizer_class": "CLIPTokenizer",
38
+ "tokenizer_file": "/home/user/.cache/huggingface/hub/models--laion--CLIP-ViT-bigG-14-laion2B-39B-b160k/snapshots/bc7788f151930d91b58474715fdce5524ad9a189/tokenizer.json",
39
  "unk_token": "<|endoftext|>"
40
  }