ekojs
/

internlm2-20b

Text Generation

text-generation-inference

Inference Endpoints

Model card | Files and versions | Community

ekojs committed on Feb 7

Commit

1f96903

•

1 Parent(s): 8be775a

Update tokenizer_config.json

Files changed (1) hide show

tokenizer_config.json +56 -11

tokenizer_config.json CHANGED Viewed

@@ -25,24 +25,69 @@
       "rstrip": false,
       "single_word": false,
       "special": true
     }
   },
   "auto_map": {
     "AutoTokenizer": [
-      "internlm/internlm2-20b--tokenization_internlm.InternLMTokenizer",
-      null
     ]
   },
   "bos_token": "<s>",
-  "clean_up_tokenization_spaces": true,
   "eos_token": "</s>",
-  "legacy": true,
   "model_max_length": 1000000000000000019884624838656,
   "pad_token": "</s>",
-  "sp_model_kwargs": {},
-  "spaces_between_special_tokens": false,
-  "tokenizer_class": "LlamaTokenizer",
-  "trust_remote_code": false,
-  "unk_token": "<unk>",
-  "use_default_system_prompt": false
-}

       "rstrip": false,
       "single_word": false,
       "special": true
+    },
+    "92538": {
+      "content": "<|plugin|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "92539": {
+      "content": "<|interpreter|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "92540": {
+      "content": "<|action_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "92541": {
+      "content": "<|action_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "92542": {
+      "content": "<|im_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "92543": {
+      "content": "<|im_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
     }
   },
   "auto_map": {
     "AutoTokenizer": [
+      "LlamaTokenizer",
+      "LlamaTokenizerFast"
     ]
   },
   "bos_token": "<s>",
+  "clean_up_tokenization_spaces": false,
+  "decode_with_prefix_space": false,
   "eos_token": "</s>",
   "model_max_length": 1000000000000000019884624838656,
   "pad_token": "</s>",
+  "sp_model_kwargs": null,
+  "tokenizer_class": "LlamaTokenizerFast",
+  "unk_token": "<unk>"
+}