empgces committed on
Commit
a867963
·
verified ·
1 Parent(s): 738a3b9

Upload model trained with Unsloth

Browse files

Upload model trained with Unsloth 2x faster

Files changed (3) hide show
  1. special_tokens_map.json +3 -3
  2. tokenizer.json +0 -99
  3. tokenizer_config.json +3 -91
special_tokens_map.json CHANGED
@@ -7,17 +7,17 @@
7
  "single_word": false
8
  },
9
  "eos_token": {
10
- "content": "<|endoftext|>",
11
  "lstrip": false,
12
  "normalized": false,
13
  "rstrip": false,
14
  "single_word": false
15
  },
16
  "pad_token": {
17
- "content": "<|placeholder6|>",
18
  "lstrip": false,
19
  "normalized": false,
20
- "rstrip": true,
21
  "single_word": false
22
  },
23
  "unk_token": {
 
7
  "single_word": false
8
  },
9
  "eos_token": {
10
+ "content": "</s>",
11
  "lstrip": false,
12
  "normalized": false,
13
  "rstrip": false,
14
  "single_word": false
15
  },
16
  "pad_token": {
17
+ "content": "<unk>",
18
  "lstrip": false,
19
  "normalized": false,
20
+ "rstrip": false,
21
  "single_word": false
22
  },
23
  "unk_token": {
tokenizer.json CHANGED
@@ -26,108 +26,9 @@
26
  "content": "</s>",
27
  "single_word": false,
28
  "lstrip": false,
29
- "rstrip": true,
30
- "normalized": false,
31
- "special": false
32
- },
33
- {
34
- "id": 32000,
35
- "content": "<|endoftext|>",
36
- "single_word": false,
37
- "lstrip": false,
38
  "rstrip": false,
39
  "normalized": false,
40
  "special": true
41
- },
42
- {
43
- "id": 32001,
44
- "content": "<|assistant|>",
45
- "single_word": false,
46
- "lstrip": false,
47
- "rstrip": true,
48
- "normalized": false,
49
- "special": true
50
- },
51
- {
52
- "id": 32002,
53
- "content": "<|placeholder1|>",
54
- "single_word": false,
55
- "lstrip": false,
56
- "rstrip": true,
57
- "normalized": false,
58
- "special": true
59
- },
60
- {
61
- "id": 32003,
62
- "content": "<|placeholder2|>",
63
- "single_word": false,
64
- "lstrip": false,
65
- "rstrip": true,
66
- "normalized": false,
67
- "special": true
68
- },
69
- {
70
- "id": 32004,
71
- "content": "<|placeholder3|>",
72
- "single_word": false,
73
- "lstrip": false,
74
- "rstrip": true,
75
- "normalized": false,
76
- "special": true
77
- },
78
- {
79
- "id": 32005,
80
- "content": "<|placeholder4|>",
81
- "single_word": false,
82
- "lstrip": false,
83
- "rstrip": true,
84
- "normalized": false,
85
- "special": true
86
- },
87
- {
88
- "id": 32006,
89
- "content": "<|system|>",
90
- "single_word": false,
91
- "lstrip": false,
92
- "rstrip": true,
93
- "normalized": false,
94
- "special": true
95
- },
96
- {
97
- "id": 32007,
98
- "content": "<|end|>",
99
- "single_word": false,
100
- "lstrip": false,
101
- "rstrip": true,
102
- "normalized": false,
103
- "special": true
104
- },
105
- {
106
- "id": 32008,
107
- "content": "<|placeholder5|>",
108
- "single_word": false,
109
- "lstrip": false,
110
- "rstrip": true,
111
- "normalized": false,
112
- "special": true
113
- },
114
- {
115
- "id": 32009,
116
- "content": "<|placeholder6|>",
117
- "single_word": false,
118
- "lstrip": false,
119
- "rstrip": true,
120
- "normalized": false,
121
- "special": true
122
- },
123
- {
124
- "id": 32010,
125
- "content": "<|user|>",
126
- "single_word": false,
127
- "lstrip": false,
128
- "rstrip": true,
129
- "normalized": false,
130
- "special": true
131
  }
132
  ],
133
  "normalizer": {
 
26
  "content": "</s>",
27
  "single_word": false,
28
  "lstrip": false,
 
 
 
 
 
 
 
 
 
29
  "rstrip": false,
30
  "normalized": false,
31
  "special": true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
32
  }
33
  ],
34
  "normalizer": {
tokenizer_config.json CHANGED
@@ -22,106 +22,18 @@
22
  "content": "</s>",
23
  "lstrip": false,
24
  "normalized": false,
25
- "rstrip": true,
26
- "single_word": false,
27
- "special": false
28
- },
29
- "32000": {
30
- "content": "<|endoftext|>",
31
- "lstrip": false,
32
- "normalized": false,
33
  "rstrip": false,
34
  "single_word": false,
35
  "special": true
36
- },
37
- "32001": {
38
- "content": "<|assistant|>",
39
- "lstrip": false,
40
- "normalized": false,
41
- "rstrip": true,
42
- "single_word": false,
43
- "special": true
44
- },
45
- "32002": {
46
- "content": "<|placeholder1|>",
47
- "lstrip": false,
48
- "normalized": false,
49
- "rstrip": true,
50
- "single_word": false,
51
- "special": true
52
- },
53
- "32003": {
54
- "content": "<|placeholder2|>",
55
- "lstrip": false,
56
- "normalized": false,
57
- "rstrip": true,
58
- "single_word": false,
59
- "special": true
60
- },
61
- "32004": {
62
- "content": "<|placeholder3|>",
63
- "lstrip": false,
64
- "normalized": false,
65
- "rstrip": true,
66
- "single_word": false,
67
- "special": true
68
- },
69
- "32005": {
70
- "content": "<|placeholder4|>",
71
- "lstrip": false,
72
- "normalized": false,
73
- "rstrip": true,
74
- "single_word": false,
75
- "special": true
76
- },
77
- "32006": {
78
- "content": "<|system|>",
79
- "lstrip": false,
80
- "normalized": false,
81
- "rstrip": true,
82
- "single_word": false,
83
- "special": true
84
- },
85
- "32007": {
86
- "content": "<|end|>",
87
- "lstrip": false,
88
- "normalized": false,
89
- "rstrip": true,
90
- "single_word": false,
91
- "special": true
92
- },
93
- "32008": {
94
- "content": "<|placeholder5|>",
95
- "lstrip": false,
96
- "normalized": false,
97
- "rstrip": true,
98
- "single_word": false,
99
- "special": true
100
- },
101
- "32009": {
102
- "content": "<|placeholder6|>",
103
- "lstrip": false,
104
- "normalized": false,
105
- "rstrip": true,
106
- "single_word": false,
107
- "special": true
108
- },
109
- "32010": {
110
- "content": "<|user|>",
111
- "lstrip": false,
112
- "normalized": false,
113
- "rstrip": true,
114
- "single_word": false,
115
- "special": true
116
  }
117
  },
118
  "bos_token": "<s>",
119
- "chat_template": "{{ bos_token }}{% for message in messages %}{% if (message['role'] == 'user') %}{{'<|user|>' + '\n' + message['content'] + '<|end|>' + '\n' + '<|assistant|>' + '\n'}}{% elif (message['role'] == 'assistant') %}{{message['content'] + '<|end|>' + '\n'}}{% endif %}{% endfor %}",
120
  "clean_up_tokenization_spaces": false,
121
- "eos_token": "<|endoftext|>",
122
  "legacy": false,
123
  "model_max_length": 4096,
124
- "pad_token": "<|placeholder6|>",
125
  "padding_side": "left",
126
  "sp_model_kwargs": {},
127
  "tokenizer_class": "LlamaTokenizer",
 
22
  "content": "</s>",
23
  "lstrip": false,
24
  "normalized": false,
 
 
 
 
 
 
 
 
25
  "rstrip": false,
26
  "single_word": false,
27
  "special": true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
28
  }
29
  },
30
  "bos_token": "<s>",
31
+ "chat_template": "{% for message in messages %}\n{% if message['role'] == 'user' %}\n{{ '<|user|>\n' + message['content'] + eos_token }}\n{% elif message['role'] == 'system' %}\n{{ '<|system|>\n' + message['content'] + eos_token }}\n{% elif message['role'] == 'assistant' %}\n{{ '<|assistant|>\n' + message['content'] + eos_token }}\n{% endif %}\n{% if loop.last and add_generation_prompt %}\n{{ '<|assistant|>' }}\n{% endif %}\n{% endfor %}",
32
  "clean_up_tokenization_spaces": false,
33
+ "eos_token": "</s>",
34
  "legacy": false,
35
  "model_max_length": 4096,
36
+ "pad_token": "<unk>",
37
  "padding_side": "left",
38
  "sp_model_kwargs": {},
39
  "tokenizer_class": "LlamaTokenizer",