Tongjilibo committed on
Commit 3efe041
1 parent: f4b7619

Change end_id to eos_token_id

Files changed (49)
  1. BELLE-LLaMA-7B-2M-enc/bert4torch_config.json +1 -1
  2. Llama-2-13b-chat-hf/bert4torch_config.json +1 -1
  3. Llama-2-13b-hf/bert4torch_config.json +1 -1
  4. Llama-2-7b-chat-hf/bert4torch_config.json +1 -1
  5. Llama-2-7b-hf/bert4torch_config.json +1 -1
  6. Meta-Llama-3-8B-Instruct/bert4torch_config.json +1 -1
  7. Meta-Llama-3-8B/bert4torch_config.json +1 -1
  8. Qwen-14B-Chat/bert4torch_config.json +1 -1
  9. Qwen-14B/bert4torch_config.json +1 -1
  10. Qwen-1_8B-Chat/bert4torch_config.json +1 -1
  11. Qwen-1_8B/bert4torch_config.json +1 -1
  12. Qwen-7B-Chat/bert4torch_config.json +1 -1
  13. Qwen-7B/bert4torch_config.json +1 -1
  14. Qwen1.5-0.5B-Chat/bert4torch_config.json +1 -1
  15. Qwen1.5-0.5B/bert4torch_config.json +1 -1
  16. Qwen1.5-1.8B-Chat/bert4torch_config.json +1 -1
  17. Qwen1.5-1.8B/bert4torch_config.json +1 -1
  18. Qwen1.5-14B-Chat/bert4torch_config.json +1 -1
  19. Qwen1.5-14B/bert4torch_config.json +1 -1
  20. Qwen1.5-7B-Chat/bert4torch_config.json +1 -1
  21. Qwen1.5-7B/bert4torch_config.json +1 -1
  22. Qwen2-0.5B-Instruct/bert4torch_config.json +1 -1
  23. Qwen2-0.5B/bert4torch_config.json +1 -1
  24. Qwen2-1.5B-Instruct/bert4torch_config.json +1 -1
  25. Qwen2-1.5B/bert4torch_config.json +1 -1
  26. Qwen2-7B-Instruct/bert4torch_config.json +1 -1
  27. Qwen2-7B/bert4torch_config.json +1 -1
  28. Yi-6B-200K/bert4torch_config.json +1 -1
  29. Yi-6B/bert4torch_config.json +1 -1
  30. Ziya-LLaMA-13B-v1.1/bert4torch_config.json +1 -1
  31. Ziya-LLaMA-13B-v1/bert4torch_config.json +1 -1
  32. chatglm3-6b-32k/bert4torch_config.json +1 -1
  33. chatglm3-6b/bert4torch_config.json +1 -1
  34. chinese_alpaca_plus_7b/bert4torch_config.json +1 -1
  35. chinese_llama_plus_7b/bert4torch_config.json +1 -1
  36. deepseek-moe-16b-base/bert4torch_config.json +1 -1
  37. glm-4-9b-chat-1m/bert4torch_config.json +1 -1
  38. glm-4-9b-chat/bert4torch_config.json +1 -1
  39. glm-4-9b/bert4torch_config.json +1 -1
  40. internlm-chat-7b/bert4torch_config.json +1 -1
  41. internlm2-1_8b/bert4torch_config.json +1 -1
  42. internlm2-7b/bert4torch_config.json +1 -1
  43. internlm2-chat-1_8b/bert4torch_config.json +1 -1
  44. internlm2-chat-7b/bert4torch_config.json +1 -1
  45. internlm2_5-7b-chat-1m/bert4torch_config.json +1 -1
  46. internlm2_5-7b-chat/bert4torch_config.json +1 -1
  47. internlm2_5-7b/bert4torch_config.json +1 -1
  48. llama-13b/bert4torch_config.json +1 -1
  49. llama-7b/bert4torch_config.json +1 -1
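Every diff below makes the same one-key change inside generation_config: the stopping-criterion key end_id is renamed to eos_token_id, with the token-id values themselves left untouched. As an illustration (values taken from the llama-7b config in this commit), a typical entry changes from

  "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "max_length": 2048, "end_id": 2}

to

  "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "max_length": 2048, "eos_token_id": 2}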
BELLE-LLaMA-7B-2M-enc/bert4torch_config.json CHANGED
@@ -11,5 +11,5 @@
  "segment_vocab_size": 0,
  "skip_init": true,
  "rope_rank": "updown",
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "max_length": 2048, "end_id": 2}
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "max_length": 2048, "eos_token_id": 2}
  }
Llama-2-13b-chat-hf/bert4torch_config.json CHANGED
@@ -18,5 +18,5 @@
  "tie_word_embeddings": false,
  "torch_dtype": "float16",
  "convert_lm_logits_dtype": "float32",
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true, "add_special_tokens": false},"end_id": 2}
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true, "add_special_tokens": false},"eos_token_id": 2}
  }
Llama-2-13b-hf/bert4torch_config.json CHANGED
@@ -18,5 +18,5 @@
  "tie_word_embeddings": false,
  "torch_dtype": "float16",
  "convert_lm_logits_dtype": "float32",
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true, "add_special_tokens": false},"end_id": 2}
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true, "add_special_tokens": false},"eos_token_id": 2}
  }
Llama-2-7b-chat-hf/bert4torch_config.json CHANGED
@@ -12,5 +12,5 @@
  "layer_norm_eps": 1e-6,
  "rope_rank": "updown",
  "convert_lm_logits_dtype": "float32",
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true, "add_special_tokens": false},"end_id": 2}
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true, "add_special_tokens": false},"eos_token_id": 2}
  }
Llama-2-7b-hf/bert4torch_config.json CHANGED
@@ -12,5 +12,5 @@
  "layer_norm_eps": 1e-5,
  "rope_rank": "updown",
  "convert_lm_logits_dtype": "float32",
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true, "add_special_tokens": false},"end_id": 2}
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true, "add_special_tokens": false},"eos_token_id": 2}
  }
Meta-Llama-3-8B-Instruct/bert4torch_config.json CHANGED
@@ -18,5 +18,5 @@
  "tie_word_embeddings": false,
  "attention_probs_dropout_prob": 0.0,
  "convert_lm_logits_dtype": "float32",
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true, "add_special_tokens": false}, "end_id": [128001, 128009]}
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true, "add_special_tokens": false}, "eos_token_id": [128001, 128009]}
  }
Meta-Llama-3-8B/bert4torch_config.json CHANGED
@@ -18,5 +18,5 @@
  "tie_word_embeddings": false,
  "attention_probs_dropout_prob": 0.0,
  "convert_lm_logits_dtype": "float32",
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true, "add_special_tokens": false}, "end_id": [128001, 128009]}
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true, "add_special_tokens": false}, "eos_token_id": [128001, 128009]}
  }
Qwen-14B-Chat/bert4torch_config.json CHANGED
@@ -22,6 +22,6 @@
  "rope_rank": "updown",
  "max_position_embeddings": 8192,
  "generation_config": {"tokenizer_config": {"allowed_special": ["<|im_end|>", "<|im_start|>", "<|endoftext|>"],
- "skip_special_tokens": true}, "end_id": [151644, 151645],
+ "skip_special_tokens": true}, "eos_token_id": [151644, 151645],
  "max_length": 8192}
  }
Qwen-14B/bert4torch_config.json CHANGED
@@ -22,6 +22,6 @@
  "rope_rank": "updown",
  "max_position_embeddings": 8192,
  "generation_config": {"tokenizer_config": {"allowed_special": ["<|im_end|>", "<|im_start|>", "<|endoftext|>"],
- "skip_special_tokens": true}, "end_id": [151643],
+ "skip_special_tokens": true}, "eos_token_id": [151643],
  "max_length": 8192}
  }
Qwen-1_8B-Chat/bert4torch_config.json CHANGED
@@ -29,6 +29,6 @@
  "rope_rank": "updown",
  "max_position": 8192,
  "generation_config": {"tokenizer_config": {"allowed_special": ["<|im_end|>", "<|im_start|>", "<|endoftext|>"],
- "skip_special_tokens": true}, "end_id": [151644, 151645],
+ "skip_special_tokens": true}, "eos_token_id": [151644, 151645],
  "max_length": 8192}
  }
Qwen-1_8B/bert4torch_config.json CHANGED
@@ -29,6 +29,6 @@
  "rope_rank": "updown",
  "max_position": 8192,
  "generation_config": {"tokenizer_config": {"allowed_special": ["<|im_end|>", "<|im_start|>", "<|endoftext|>"],
- "skip_special_tokens": true}, "end_id": [151643],
+ "skip_special_tokens": true}, "eos_token_id": [151643],
  "max_length": 8192}
  }
Qwen-7B-Chat/bert4torch_config.json CHANGED
@@ -29,6 +29,6 @@
  "rope_rank": "updown",
  "max_position": 8192,
  "generation_config": {"tokenizer_config": {"allowed_special": ["<|im_end|>", "<|im_start|>", "<|endoftext|>"],
- "skip_special_tokens": true}, "end_id": [151644, 151645],
+ "skip_special_tokens": true}, "eos_token_id": [151644, 151645],
  "max_length": 8192}
  }
Qwen-7B/bert4torch_config.json CHANGED
@@ -29,6 +29,6 @@
  "rope_rank": "updown",
  "max_position": 8192,
  "generation_config": {"tokenizer_config": {"allowed_special": ["<|im_end|>", "<|im_start|>", "<|endoftext|>"],
- "skip_special_tokens": true}, "end_id": [151643],
+ "skip_special_tokens": true}, "eos_token_id": [151643],
  "max_length": 8192}
  }
Qwen1.5-0.5B-Chat/bert4torch_config.json CHANGED
@@ -24,6 +24,6 @@
  "sliding_window": 32768,
  "max_window_layers": 21,
  "convert_lm_logits_dtype": "float32",
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "end_id": [151644, 151645],
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "eos_token_id": [151644, 151645],
  "max_length": 32768}
  }
Qwen1.5-0.5B/bert4torch_config.json CHANGED
@@ -24,6 +24,6 @@
  "sliding_window": 32768,
  "max_window_layers": 21,
  "convert_lm_logits_dtype": "float32",
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "end_id": [151643],
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "eos_token_id": [151643],
  "max_length": 32768}
  }
Qwen1.5-1.8B-Chat/bert4torch_config.json CHANGED
@@ -24,6 +24,6 @@
  "sliding_window": 32768,
  "max_window_layers": 21,
  "convert_lm_logits_dtype": "float32",
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "end_id": [151644, 151645],
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "eos_token_id": [151644, 151645],
  "max_length": 32768}
  }
Qwen1.5-1.8B/bert4torch_config.json CHANGED
@@ -24,6 +24,6 @@
  "sliding_window": 32768,
  "max_window_layers": 21,
  "convert_lm_logits_dtype": "float32",
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "end_id": [151643],
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "eos_token_id": [151643],
  "max_length": 32768}
  }
Qwen1.5-14B-Chat/bert4torch_config.json CHANGED
@@ -24,6 +24,6 @@
  "sliding_window": 32768,
  "max_window_layers": 35,
  "convert_lm_logits_dtype": "float32",
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "end_id": [151644, 151645],
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "eos_token_id": [151644, 151645],
  "max_length": 32768}
  }
Qwen1.5-14B/bert4torch_config.json CHANGED
@@ -24,6 +24,6 @@
  "sliding_window": 32768,
  "max_window_layers": 35,
  "convert_lm_logits_dtype": "float32",
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "end_id": [151643],
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "eos_token_id": [151643],
  "max_length": 32768}
  }
Qwen1.5-7B-Chat/bert4torch_config.json CHANGED
@@ -24,6 +24,6 @@
  "sliding_window": 32768,
  "max_window_layers": 28,
  "convert_lm_logits_dtype": "float32",
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "end_id": [151644, 151645],
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "eos_token_id": [151644, 151645],
  "max_length": 32768}
  }
Qwen1.5-7B/bert4torch_config.json CHANGED
@@ -24,6 +24,6 @@
  "sliding_window": 32768,
  "max_window_layers": 28,
  "convert_lm_logits_dtype": "float32",
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "end_id": [151643],
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "eos_token_id": [151643],
  "max_length": 32768}
  }
Qwen2-0.5B-Instruct/bert4torch_config.json CHANGED
@@ -24,6 +24,6 @@
  "sliding_window": 32768,
  "max_window_layers": 24,
  "convert_lm_logits_dtype": "float32",
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "end_id": [151644, 151645],
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "eos_token_id": [151644, 151645],
  "max_length": 32768}
  }
Qwen2-0.5B/bert4torch_config.json CHANGED
@@ -24,6 +24,6 @@
  "sliding_window": 32768,
  "max_window_layers": 24,
  "convert_lm_logits_dtype": "float32",
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "end_id": [151643],
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "eos_token_id": [151643],
  "max_length": 32768}
  }
Qwen2-1.5B-Instruct/bert4torch_config.json CHANGED
@@ -24,6 +24,6 @@
  "sliding_window": 32768,
  "max_window_layers": 28,
  "convert_lm_logits_dtype": "float32",
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "end_id": [151644, 151645],
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "eos_token_id": [151644, 151645],
  "max_length": 32768}
  }
Qwen2-1.5B/bert4torch_config.json CHANGED
@@ -24,6 +24,6 @@
  "sliding_window": 32768,
  "max_window_layers": 28,
  "convert_lm_logits_dtype": "float32",
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "end_id": [151643],
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "eos_token_id": [151643],
  "max_length": 32768}
  }
Qwen2-7B-Instruct/bert4torch_config.json CHANGED
@@ -24,6 +24,6 @@
  "sliding_window": 131072,
  "max_window_layers": 28,
  "convert_lm_logits_dtype": "float32",
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "end_id": [151644, 151645],
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "eos_token_id": [151644, 151645],
  "max_length": 32768}
  }
Qwen2-7B/bert4torch_config.json CHANGED
@@ -24,6 +24,6 @@
  "sliding_window": 131072,
  "max_window_layers": 28,
  "convert_lm_logits_dtype": "float32",
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "end_id": [151643],
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "eos_token_id": [151643],
  "max_length": 32768}
  }
Yi-6B-200K/bert4torch_config.json CHANGED
@@ -19,7 +19,7 @@
  "skip_init": true,
  "rope_rank": "updown",
  "segment_vocab_size": 0,
- "generation_config": {"tokenizer_decode_config": {"skip_special_tokens": true}, "max_length": 4096, "end_id": 2},
+ "generation_config": {"tokenizer_decode_config": {"skip_special_tokens": true}, "max_length": 4096, "eos_token_id": 2},
  "mapping": {
  "embeddings.word_embeddings.weight": "model.embed_tokens.weight",
  "LayerNormFinal.weight": "model.norm.weight",
Yi-6B/bert4torch_config.json CHANGED
@@ -19,7 +19,7 @@
  "skip_init": true,
  "rope_rank": "updown",
  "segment_vocab_size": 0,
- "generation_config": {"tokenizer_decode_config": {"skip_special_tokens": true}, "max_length": 4096, "end_id": 2},
+ "generation_config": {"tokenizer_decode_config": {"skip_special_tokens": true}, "max_length": 4096, "eos_token_id": 2},
  "mapping": {
  "embeddings.word_embeddings.weight": "model.embed_tokens.weight",
  "LayerNormFinal.weight": "model.norm.weight",
Ziya-LLaMA-13B-v1.1/bert4torch_config.json CHANGED
@@ -18,5 +18,5 @@
  "segment_vocab_size": 0,
  "skip_init": true,
  "rope_rank": "updown",
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "max_length": 2048, "end_id": 2}
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "max_length": 2048, "eos_token_id": 2}
  }
Ziya-LLaMA-13B-v1/bert4torch_config.json CHANGED
@@ -18,5 +18,5 @@
  "segment_vocab_size": 0,
  "skip_init": true,
  "rope_rank": "updown",
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "max_length": 2048, "end_id": 2}
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "max_length": 2048, "eos_token_id": 2}
  }
chatglm3-6b-32k/bert4torch_config.json CHANGED
@@ -21,5 +21,5 @@
  "position_encoding_2d": true,
  "flash_attention": true,
  "generation_config": {"tokenizer_config": {"additional_special_tokens": ["<|user|>", "<|observation|>"],
- "skip_special_tokens": true}, "end_id": [2, 64795, 64797], "max_length": 32768}
+ "skip_special_tokens": true}, "eos_token_id": [2, 64795, 64797], "max_length": 32768}
  }
chatglm3-6b/bert4torch_config.json CHANGED
@@ -20,5 +20,5 @@
  "position_encoding_2d": true,
  "flash_attention": true,
  "generation_config": {"tokenizer_config": {"additional_special_tokens": ["<|user|>", "<|observation|>"],
- "skip_special_tokens": true}, "end_id": [2, 64795, 64797], "max_length": 8192}
+ "skip_special_tokens": true}, "eos_token_id": [2, 64795, 64797], "max_length": 8192}
  }
chinese_alpaca_plus_7b/bert4torch_config.json CHANGED
@@ -11,5 +11,5 @@
  "segment_vocab_size": 0,
  "skip_init": true,
  "rope_rank": "updown",
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "max_length": 2048, "end_id": 2}
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "max_length": 2048, "eos_token_id": 2}
  }
chinese_llama_plus_7b/bert4torch_config.json CHANGED
@@ -11,5 +11,5 @@
  "segment_vocab_size": 0,
  "skip_init": true,
  "rope_rank": "updown",
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "max_length": 2048, "end_id": 2}
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "max_length": 2048, "eos_token_id": 2}
  }
deepseek-moe-16b-base/bert4torch_config.json CHANGED
@@ -32,5 +32,5 @@
  "skip_init": true,
  "segment_vocab_size": 0,
  "rope_rank": "updown",
- "generation_config": {"tokenizer_config": {"add_special_tokens": false, "skip_special_tokens": true}, "max_length": 4096, "end_id": 100001}
+ "generation_config": {"tokenizer_config": {"add_special_tokens": false, "skip_special_tokens": true}, "max_length": 4096, "eos_token_id": 100001}
  }
glm-4-9b-chat-1m/bert4torch_config.json CHANGED
@@ -21,5 +21,5 @@
  "eos_token_id": [151329, 151336, 151338],
  "pad_token_id": 151329,
  "generation_config": {"tokenizer_config": {"skip_special_tokens": true},
- "end_id": [151329, 151336, 151338], "max_length": 131072}
+ "eos_token_id": [151329, 151336, 151338], "max_length": 131072}
  }
glm-4-9b-chat/bert4torch_config.json CHANGED
@@ -21,5 +21,5 @@
  "eos_token_id": [151329, 151336, 151338],
  "pad_token_id": 151329,
  "generation_config": {"tokenizer_config": {"skip_special_tokens": true},
- "end_id": [151329, 151336, 151338], "max_length": 131072}
+ "eos_token_id": [151329, 151336, 151338], "max_length": 131072}
  }
glm-4-9b/bert4torch_config.json CHANGED
@@ -20,5 +20,5 @@
  "eos_token_id": [151329, 151336, 151338],
  "pad_token_id": 151329,
  "generation_config": {"tokenizer_config": {"skip_special_tokens": true},
- "end_id": [151329, 151336, 151338], "max_length": 131072}
+ "eos_token_id": [151329, 151336, 151338], "max_length": 131072}
  }
internlm-chat-7b/bert4torch_config.json CHANGED
@@ -13,5 +13,5 @@
  "rope_rank": "updown",
  "torch_dtype": "float16",
  "tie_word_embeddings": false,
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "end_id": [2, 103028], "max_length": 2048}
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "eos_token_id": [2, 103028], "max_length": 2048}
  }
internlm2-1_8b/bert4torch_config.json CHANGED
@@ -24,5 +24,5 @@
  "rope_rank": "updown",
  "torch_dtype": "float16",
  "vocab_size": 92544,
- "generation_config": {"end_id": [2, 92542], "max_length": 32768}
+ "generation_config": {"eos_token_id": [2, 92542], "max_length": 32768}
  }
internlm2-7b/bert4torch_config.json CHANGED
@@ -24,5 +24,5 @@
  "segment_vocab_size": 0,
  "skip_init": true,
  "rope_rank": "updown",
- "generation_config": {"end_id": [2, 92542], "max_length": 32768}
+ "generation_config": {"eos_token_id": [2, 92542], "max_length": 32768}
  }
internlm2-chat-1_8b/bert4torch_config.json CHANGED
@@ -24,5 +24,5 @@
  "rope_rank": "updown",
  "torch_dtype": "float16",
  "vocab_size": 92544,
- "generation_config": {"end_id": [2, 92542], "max_length": 32768}
+ "generation_config": {"eos_token_id": [2, 92542], "max_length": 32768}
  }
internlm2-chat-7b/bert4torch_config.json CHANGED
@@ -24,5 +24,5 @@
  "segment_vocab_size": 0,
  "skip_init": true,
  "rope_rank": "updown",
- "generation_config": {"end_id": [2, 92542], "max_length": 32768}
+ "generation_config": {"eos_token_id": [2, 92542], "max_length": 32768}
  }
internlm2_5-7b-chat-1m/bert4torch_config.json CHANGED
@@ -24,5 +24,5 @@
  "segment_vocab_size": 0,
  "skip_init": true,
  "rope_rank": "updown",
- "generation_config": {"end_id": [2, 92542], "max_length": 262144}
+ "generation_config": {"eos_token_id": [2, 92542], "max_length": 262144}
  }
internlm2_5-7b-chat/bert4torch_config.json CHANGED
@@ -24,5 +24,5 @@
  "segment_vocab_size": 0,
  "skip_init": true,
  "rope_rank": "updown",
- "generation_config": {"end_id": [2, 92542], "max_length": 32768}
+ "generation_config": {"eos_token_id": [2, 92542], "max_length": 32768}
  }
internlm2_5-7b/bert4torch_config.json CHANGED
@@ -24,5 +24,5 @@
  "segment_vocab_size": 0,
  "skip_init": true,
  "rope_rank": "updown",
- "generation_config": {"end_id": [2, 92542], "max_length": 32768}
+ "generation_config": {"eos_token_id": [2, 92542], "max_length": 32768}
  }
llama-13b/bert4torch_config.json CHANGED
@@ -13,5 +13,5 @@
  "skip_init": true,
  "rope_rank": "updown",
  "convert_lm_logits_dtype": "float32",
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "max_length": 2048, "end_id": 2}
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "max_length": 2048, "eos_token_id": 2}
  }
llama-7b/bert4torch_config.json CHANGED
@@ -13,5 +13,5 @@
  "skip_init": true,
  "rope_rank": "updown",
  "convert_lm_logits_dtype": "float32",
- "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "max_length": 2048, "end_id": 2}
+ "generation_config": {"tokenizer_config": {"skip_special_tokens": true}, "max_length": 2048, "eos_token_id": 2}
  }