ZekeWang committed on
Commit
d9d1ad8
1 Parent(s): 6258dc2

Update Nanbeige1.5 8B Chat Model

Browse files
added_tokens.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
  "<|endoftext|>": 58980,
3
- "<|im_end|>": 58978,
4
- "<|im_start|>": 58979
5
  }
 
1
  {
2
  "<|endoftext|>": 58980,
3
+ "<|im_end|>": 58979,
4
+ "<|im_start|>": 58978
5
  }
config.json CHANGED
@@ -7,7 +7,7 @@
7
  "AutoModelForCausalLM": "modeling_nanbeige.NanbeigeForCausalLM"
8
  },
9
  "bos_token_id": 1,
10
- "eos_token_id": 58978,
11
  "hidden_act": "silu",
12
  "hidden_size": 4096,
13
  "initializer_range": 0.02,
@@ -25,7 +25,7 @@
25
  "rope_theta": 10000.0,
26
  "tie_word_embeddings": false,
27
  "torch_dtype": "bfloat16",
28
- "transformers_version": "4.37.0",
29
  "use_cache": true,
30
  "vocab_size": 59392
31
  }
 
7
  "AutoModelForCausalLM": "modeling_nanbeige.NanbeigeForCausalLM"
8
  },
9
  "bos_token_id": 1,
10
+ "eos_token_id": 58979,
11
  "hidden_act": "silu",
12
  "hidden_size": 4096,
13
  "initializer_range": 0.02,
 
25
  "rope_theta": 10000.0,
26
  "tie_word_embeddings": false,
27
  "torch_dtype": "bfloat16",
28
+ "transformers_version": "4.35.0",
29
  "use_cache": true,
30
  "vocab_size": 59392
31
  }
generation_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "_from_model_config": true,
3
  "bos_token_id": 1,
4
- "eos_token_id": 58978,
5
  "max_length": 4096,
6
  "pad_token_id": 0,
7
  "do_sample": true,
 
1
  {
2
  "_from_model_config": true,
3
  "bos_token_id": 1,
4
+ "eos_token_id": 58979,
5
  "max_length": 4096,
6
  "pad_token_id": 0,
7
  "do_sample": true,
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:18be302bfb6dea82e57be5a59543363935113c03d3fc6d43e203f1b3c59d10b2
3
  size 4972539320
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c94b07a7e08d2e4020ddfc5b174af27361a7a99e36eb08da0624fd7d3201b20
3
  size 4972539320
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:569bfe51e2b0c021aaf576f5ad0962474b752294b2e1fd6b32db7e465c7a5c97
3
  size 4957876888
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c080f13d52bd6d74de59eb8144ad92f0ff8d523dd80bb0fdcbc13f6f15f569f
3
  size 4957876888
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2512fd0bcf2917726595baf9ab525f9894665b8fcc7aba99074575f8b6a6fd1f
3
  size 4947390888
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:188cca2bf9ab4130a11db62adb6189800c25d25086fbf318c82d09a9b2d3d1b4
3
  size 4947390888
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5630abbb5e933ba68921255cc8b9692f1ab5337ef61d98b3fbb9d2806e204b14
3
  size 666919584
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37c82939cf09ec1b7c67dd4f06eeae3e151eb6b360ddb76ffefa59081dce5c98
3
  size 666919584
special_tokens_map.json CHANGED
@@ -1,4 +1,27 @@
1
  {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2
  "bos_token": "<|im_start|>",
3
  "eos_token": "<|im_end|>",
4
  "pad_token": {
 
1
  {
2
+ "additional_special_tokens": [
3
+ {
4
+ "content": "<|im_start|>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false
9
+ },
10
+ {
11
+ "content": "<|im_end|>",
12
+ "lstrip": false,
13
+ "normalized": false,
14
+ "rstrip": false,
15
+ "single_word": false
16
+ },
17
+ {
18
+ "content": "<|endoftext|>",
19
+ "lstrip": false,
20
+ "normalized": false,
21
+ "rstrip": false,
22
+ "single_word": false
23
+ }
24
+ ],
25
  "bos_token": "<|im_start|>",
26
  "eos_token": "<|im_end|>",
27
  "pad_token": {
tokenizer.json CHANGED
@@ -32,7 +32,7 @@
32
  },
33
  {
34
  "id": 58978,
35
- "content": "<|im_end|>",
36
  "single_word": false,
37
  "lstrip": false,
38
  "rstrip": false,
@@ -41,7 +41,7 @@
41
  },
42
  {
43
  "id": 58979,
44
- "content": "<|im_start|>",
45
  "single_word": false,
46
  "lstrip": false,
47
  "rstrip": false,
@@ -121,7 +121,7 @@
121
  "<|im_start|>": {
122
  "id": "<|im_start|>",
123
  "ids": [
124
- 58979
125
  ],
126
  "tokens": [
127
  "<|im_start|>"
 
32
  },
33
  {
34
  "id": 58978,
35
+ "content": "<|im_start|>",
36
  "single_word": false,
37
  "lstrip": false,
38
  "rstrip": false,
 
41
  },
42
  {
43
  "id": 58979,
44
+ "content": "<|im_end|>",
45
  "single_word": false,
46
  "lstrip": false,
47
  "rstrip": false,
 
121
  "<|im_start|>": {
122
  "id": "<|im_start|>",
123
  "ids": [
124
+ 58978
125
  ],
126
  "tokens": [
127
  "<|im_start|>"
tokenizer_config.json CHANGED
@@ -1,4 +1,6 @@
1
  {
 
 
2
  "added_tokens_decoder": {
3
  "0": {
4
  "content": "<unk>",
@@ -25,7 +27,7 @@
25
  "special": true
26
  },
27
  "58978": {
28
- "content": "<|im_end|>",
29
  "lstrip": false,
30
  "normalized": false,
31
  "rstrip": false,
@@ -33,7 +35,7 @@
33
  "special": true
34
  },
35
  "58979": {
36
- "content": "<|im_start|>",
37
  "lstrip": false,
38
  "normalized": false,
39
  "rstrip": false,
@@ -49,9 +51,11 @@
49
  "special": true
50
  }
51
  },
52
- "add_bos_token": false,
53
- "add_eos_token": false,
54
- "additional_special_tokens": [],
 
 
55
  "bos_token": "<|im_start|>",
56
  "chat_template": "{% for message in messages %}{% if loop.first and messages[0]['role'] != 'system' %}{{ '<|im_start|>system\n你是一个名为\"南北阁\"的人工智能助手,正在与人类用户进行交谈。你的目标是以最有帮助和最逻辑的方式回答问题,同时确保内容的安全性。你的回答中不应包含任何有害、政治化、宗教化、不道德、种族主义、非法的内容。请确保你的回答不带有社会偏见,符合社会主义价值观。如果遇到的问题无意义或事实上不连贯,请不要回答错误的内容,而是解释问题为何无效或不连贯。如果你不知道问题的答案,也请勿提供错误的信息。<|im_end|>\n' }}{% endif %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if (add_generation_prompt is defined and add_generation_prompt) %}{{ '<|im_start|>assistant\n' }}{% endif %}",
57
  "clean_up_tokenization_spaces": false,
 
1
  {
2
+ "add_bos_token": false,
3
+ "add_eos_token": false,
4
  "added_tokens_decoder": {
5
  "0": {
6
  "content": "<unk>",
 
27
  "special": true
28
  },
29
  "58978": {
30
+ "content": "<|im_start|>",
31
  "lstrip": false,
32
  "normalized": false,
33
  "rstrip": false,
 
35
  "special": true
36
  },
37
  "58979": {
38
+ "content": "<|im_end|>",
39
  "lstrip": false,
40
  "normalized": false,
41
  "rstrip": false,
 
51
  "special": true
52
  }
53
  },
54
+ "additional_special_tokens": [
55
+ "<|im_start|>",
56
+ "<|im_end|>",
57
+ "<|endoftext|>"
58
+ ],
59
  "bos_token": "<|im_start|>",
60
  "chat_template": "{% for message in messages %}{% if loop.first and messages[0]['role'] != 'system' %}{{ '<|im_start|>system\n你是一个名为\"南北阁\"的人工智能助手,正在与人类用户进行交谈。你的目标是以最有帮助和最逻辑的方式回答问题,同时确保内容的安全性。你的回答中不应包含任何有害、政治化、宗教化、不道德、种族主义、非法的内容。请确保你的回答不带有社会偏见,符合社会主义价值观。如果遇到的问题无意义或事实上不连贯,请不要回答错误的内容,而是解释问题为何无效或不连贯。如果你不知道问题的答案,也请勿提供错误的信息。<|im_end|>\n' }}{% endif %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if (add_generation_prompt is defined and add_generation_prompt) %}{{ '<|im_start|>assistant\n' }}{% endif %}",
61
  "clean_up_tokenization_spaces": false,