1abf72c3398ae3bdbfe3876ef71c86a266c4229966d8170b459d605a20d52a6e

Browse files

Files changed (7) hide show

README.md +5 -1
added_tokens.json +6 -33
config.json +1 -1
sample_finetune.py +118 -29
special_tokens_map.json +0 -3
tokenizer.json +18 -261
tokenizer_config.json +19 -238

README.md CHANGED Viewed

@@ -8,10 +8,14 @@ tags:
 - mlx
 license_link: https://huggingface.co/microsoft/Phi-3-mini-4k-instruct/resolve/main/LICENSE
 pipeline_tag: text-generation
 ---
 # mlx-community/Phi-3-mini-4k-instruct-4bit-no-q-embed
-This model was converted to MLX format from [`microsoft/Phi-3-mini-4k-instruct`]() using mlx-lm version **0.10.0**.
 Refer to the [original model card](https://huggingface.co/microsoft/Phi-3-mini-4k-instruct) for more details on the model.
 ## Use with mlx

 - mlx
 license_link: https://huggingface.co/microsoft/Phi-3-mini-4k-instruct/resolve/main/LICENSE
 pipeline_tag: text-generation
+widget:
+- messages:
+  - role: user
+    content: Can you provide ways to eat combinations of bananas and dragonfruits?
 ---
 # mlx-community/Phi-3-mini-4k-instruct-4bit-no-q-embed
+This model was converted to MLX format from [`microsoft/Phi-3-mini-4k-instruct`]() using mlx-lm version **0.12.0**.
 Refer to the [original model card](https://huggingface.co/microsoft/Phi-3-mini-4k-instruct) for more details on the model.
 ## Use with mlx

added_tokens.json CHANGED Viewed

@@ -1,40 +1,13 @@
 {
-  "<|/code|>": 32014,
-  "<|/data|>": 32033,
-  "<|/inst|>": 32037,
-  "<|/query|>": 32031,
-  "<|/sys|>": 32035,
-  "<|assistant_mask|>": 32017,
   "<|assistant|>": 32001,
-  "<|calc|>": 32012,
-  "<|code|>": 32013,
-  "<|continue|>": 32009,
-  "<|data|>": 32032,
-  "<|diff_marker|>": 32025,
-  "<|disc_sep|>": 32029,
-  "<|disc_start|>": 32028,
-  "<|disc_thread|><|query|>": 32030,
   "<|endoftext|>": 32000,
   "<|end|>": 32007,
-  "<|fim_middle|>": 32021,
-  "<|fim_prefix|>": 32020,
-  "<|fim_suffix|>": 32022,
-  "<|function_call|>": 32005,
-  "<|function_list|>": 32011,
-  "<|function_output|>": 32003,
-  "<|ghissue|>": 32026,
-  "<|ghreview|>": 32027,
-  "<|inst|>": 32036,
-  "<|ipynb_marker|>": 32024,
-  "<|message|>": 32019,
-  "<|meta_start|>": 32023,
-  "<|raw|>": 32008,
-  "<|resource|>": 32016,
-  "<|start|>": 32018,
-  "<|step|>": 32002,
-  "<|summary|>": 32015,
   "<|system|>": 32006,
-  "<|sys|>": 32034,
-  "<|tag|>": 32004,
   "<|user|>": 32010
 }

 {
   "<|assistant|>": 32001,
   "<|endoftext|>": 32000,
   "<|end|>": 32007,
+  "<|placeholder1|>": 32002,
+  "<|placeholder2|>": 32003,
+  "<|placeholder3|>": 32004,
+  "<|placeholder4|>": 32005,
+  "<|placeholder5|>": 32008,
+  "<|placeholder6|>": 32009,
   "<|system|>": 32006,
   "<|user|>": 32010
 }

config.json CHANGED Viewed

@@ -29,7 +29,7 @@
     "rms_norm_eps": 1e-05,
     "rope_scaling": null,
     "rope_theta": 10000.0,
-    "sliding_window": 2048,
     "tie_word_embeddings": false,
     "torch_dtype": "bfloat16",
     "transformers_version": "4.39.3",

     "rms_norm_eps": 1e-05,
     "rope_scaling": null,
     "rope_theta": 10000.0,
+    "sliding_window": 2047,
     "tie_word_embeddings": false,
     "torch_dtype": "bfloat16",
     "transformers_version": "4.39.3",

sample_finetune.py CHANGED Viewed

@@ -1,28 +1,68 @@
-import torch
 from datasets import load_dataset
 from trl import SFTTrainer
-from transformers import AutoModelForCausalLM, AutoTokenizer, TrainingArguments
 """
 A simple example on using SFTTrainer and Accelerate to finetune Phi-3 models. For
-a more advanced example, please follow HF alignment-handbook/scripts/run_sft.py
-1. Install accelerate:
     conda install -c conda-forge accelerate
-2. Setup accelerate config:
     accelerate config
-to simply use all the GPUs available:
-    python -c "from accelerate.utils import write_basic_config; write_basic_config(mixed_precision='bf16')"
-check accelerate config:
     accelerate env
-3. Run the code:
     accelerate launch sample_finetune.py
 """
 ###################
 # Hyper-parameters
 ###################
-args = {
     "bf16": True,
     "do_eval": False,
     "learning_rate": 5.0e-06,
@@ -35,7 +75,7 @@ args = {
     "output_dir": "./checkpoint_dir",
     "overwrite_output_dir": True,
     "per_device_eval_batch_size": 4,
-    "per_device_train_batch_size": 8,
     "remove_unused_columns": True,
     "save_steps": 100,
     "save_total_limit": 1,
@@ -45,8 +85,43 @@ args = {
     "gradient_accumulation_steps": 1,
     "warmup_ratio": 0.2,
     }
-training_args = TrainingArguments(**args)
 ################
 # Model Loading
@@ -58,14 +133,16 @@ model_kwargs = dict(
     trust_remote_code=True,
     attn_implementation="flash_attention_2",  # loading the model with flash-attention support
     torch_dtype=torch.bfloat16,
-    device_map="cuda",
 )
 model = AutoModelForCausalLM.from_pretrained(checkpoint_path, **model_kwargs)
 tokenizer = AutoTokenizer.from_pretrained(checkpoint_path)
 tokenizer.pad_token = tokenizer.unk_token  # use unk rather than eos token to prevent endless generation
 tokenizer.pad_token_id = tokenizer.convert_tokens_to_ids(tokenizer.pad_token)
 tokenizer.padding_side = 'right'
 ##################
 # Data Processing
 ##################
@@ -82,26 +159,36 @@ def apply_chat_template(
     return example
 raw_dataset = load_dataset("HuggingFaceH4/ultrachat_200k")
-column_names = list(raw_dataset["train_sft"].features)
-processed_dataset = raw_dataset.map(
     apply_chat_template,
     fn_kwargs={"tokenizer": tokenizer},
-    num_proc=12,
     remove_columns=column_names,
-    desc="Applying chat template",
 )
-train_dataset = processed_dataset["train_sft"]
-eval_dataset = processed_dataset["test_sft"]
 ###########
 # Training
 ###########
 trainer = SFTTrainer(
     model=model,
-    args=training_args,
-    train_dataset=train_dataset,
-    eval_dataset=eval_dataset,
     max_seq_length=2048,
     dataset_text_field="text",
     tokenizer=tokenizer,
@@ -113,16 +200,18 @@ trainer.log_metrics("train", metrics)
 trainer.save_metrics("train", metrics)
 trainer.save_state()
 #############
 # Evaluation
 #############
 tokenizer.padding_side = 'left'
 metrics = trainer.evaluate()
-metrics["eval_samples"] = len(eval_dataset)
 trainer.log_metrics("eval", metrics)
 trainer.save_metrics("eval", metrics)
-############
-# Save model
-############
-trainer.save_model(training_args.output_dir)

+import sys
+import logging
+import datasets
 from datasets import load_dataset
+from peft import LoraConfig
+import torch
+import transformers
 from trl import SFTTrainer
+from transformers import AutoModelForCausalLM, AutoTokenizer, TrainingArguments, BitsAndBytesConfig
 """
 A simple example on using SFTTrainer and Accelerate to finetune Phi-3 models. For
+a more advanced example, please follow HF alignment-handbook/scripts/run_sft.py.
+This example uses DeepSpeed ZeRO3 offload to reduce memory usage. The
+script can be run on V100 or later generation GPUs. Here are some suggestions for
+further reducing memory consumption:
+    - reduce batch size
+    - decrease lora dimension
+    - restrict lora target modules
+Please follow these steps to run the script:
+1. Install dependencies:
     conda install -c conda-forge accelerate
+    pip3 install -i https://pypi.org/simple/ bitsandbytes
+    pip3 install peft transformers trl datasets
+    pip3 install deepspeed
+2. Setup accelerate and deepspeed config based on the machine used:
     accelerate config
+Here is a sample config for deepspeed zero3:
+    compute_environment: LOCAL_MACHINE
+    debug: false
+    deepspeed_config:
+      gradient_accumulation_steps: 1
+      offload_optimizer_device: none
+      offload_param_device: none
+      zero3_init_flag: true
+      zero3_save_16bit_model: true
+      zero_stage: 3
+    distributed_type: DEEPSPEED
+    downcast_bf16: 'no'
+    enable_cpu_affinity: false
+    machine_rank: 0
+    main_training_function: main
+    mixed_precision: bf16
+    num_machines: 1
+    num_processes: 4
+    rdzv_backend: static
+    same_network: true
+    tpu_env: []
+    tpu_use_cluster: false
+    tpu_use_sudo: false
+    use_cpu: false
+3. check accelerate config:
     accelerate env
+4. Run the code:
     accelerate launch sample_finetune.py
 """
+logger = logging.getLogger(__name__)
 ###################
 # Hyper-parameters
 ###################
+training_config = {
     "bf16": True,
     "do_eval": False,
     "learning_rate": 5.0e-06,
     "output_dir": "./checkpoint_dir",
     "overwrite_output_dir": True,
     "per_device_eval_batch_size": 4,
+    "per_device_train_batch_size": 4,
     "remove_unused_columns": True,
     "save_steps": 100,
     "save_total_limit": 1,
     "gradient_accumulation_steps": 1,
     "warmup_ratio": 0.2,
     }
+peft_config = {
+    "r": 16,
+    "lora_alpha": 32,
+    "lora_dropout": 0.05,
+    "bias": "none",
+    "task_type": "CAUSAL_LM",
+    "target_modules": "all-linear",
+    "modules_to_save": None,
+}
+train_conf = TrainingArguments(**training_config)
+peft_conf = LoraConfig(**peft_config)
+###############
+# Setup logging
+###############
+logging.basicConfig(
+    format="%(asctime)s - %(levelname)s - %(name)s - %(message)s",
+    datefmt="%Y-%m-%d %H:%M:%S",
+    handlers=[logging.StreamHandler(sys.stdout)],
+)
+log_level = train_conf.get_process_log_level()
+logger.setLevel(log_level)
+datasets.utils.logging.set_verbosity(log_level)
+transformers.utils.logging.set_verbosity(log_level)
+transformers.utils.logging.enable_default_handler()
+transformers.utils.logging.enable_explicit_format()
+# Log on each process a small summary
+logger.warning(
+    f"Process rank: {train_conf.local_rank}, device: {train_conf.device}, n_gpu: {train_conf.n_gpu}"
+    + f" distributed training: {bool(train_conf.local_rank != -1)}, 16-bits training: {train_conf.fp16}"
+)
+logger.info(f"Training/evaluation parameters {train_conf}")
+logger.info(f"PEFT parameters {peft_conf}")
 ################
 # Model Loading
     trust_remote_code=True,
     attn_implementation="flash_attention_2",  # loading the model with flash-attention support
     torch_dtype=torch.bfloat16,
+    device_map=None
 )
 model = AutoModelForCausalLM.from_pretrained(checkpoint_path, **model_kwargs)
 tokenizer = AutoTokenizer.from_pretrained(checkpoint_path)
+tokenizer.model_max_length = 2048
 tokenizer.pad_token = tokenizer.unk_token  # use unk rather than eos token to prevent endless generation
 tokenizer.pad_token_id = tokenizer.convert_tokens_to_ids(tokenizer.pad_token)
 tokenizer.padding_side = 'right'
 ##################
 # Data Processing
 ##################
     return example
 raw_dataset = load_dataset("HuggingFaceH4/ultrachat_200k")
+train_dataset = raw_dataset["train_sft"]
+test_dataset = raw_dataset["test_sft"]
+column_names = list(train_dataset.features)
+processed_train_dataset = train_dataset.map(
     apply_chat_template,
     fn_kwargs={"tokenizer": tokenizer},
+    num_proc=10,
     remove_columns=column_names,
+    desc="Applying chat template to train_sft",
 )
+processed_test_dataset = test_dataset.map(
+    apply_chat_template,
+    fn_kwargs={"tokenizer": tokenizer},
+    num_proc=10,
+    remove_columns=column_names,
+    desc="Applying chat template to test_sft",
+)
 ###########
 # Training
 ###########
 trainer = SFTTrainer(
     model=model,
+    args=train_conf,
+    peft_config=peft_conf,
+    train_dataset=processed_train_dataset,
+    eval_dataset=processed_test_dataset,
     max_seq_length=2048,
     dataset_text_field="text",
     tokenizer=tokenizer,
 trainer.save_metrics("train", metrics)
 trainer.save_state()
 #############
 # Evaluation
 #############
 tokenizer.padding_side = 'left'
 metrics = trainer.evaluate()
+metrics["eval_samples"] = len(processed_test_dataset)
 trainer.log_metrics("eval", metrics)
 trainer.save_metrics("eval", metrics)
+# ############
+# # Save model
+# ############
+trainer.save_model(train_conf.output_dir)

special_tokens_map.json CHANGED Viewed

@@ -1,7 +1,4 @@
 {
-  "additional_special_tokens": [
-    "<|/inst|>"
-  ],
   "bos_token": {
     "content": "<s>",
     "lstrip": false,

 {
   "bos_token": {
     "content": "<s>",
     "lstrip": false,

tokenizer.json CHANGED Viewed

@@ -26,9 +26,9 @@
       "content": "</s>",
       "single_word": false,
       "lstrip": false,
-      "rstrip": true,
       "normalized": false,
-      "special": false
     },
     {
       "id": 32000,
@@ -44,43 +44,43 @@
       "content": "<|assistant|>",
       "single_word": false,
       "lstrip": false,
-      "rstrip": true,
       "normalized": false,
       "special": true
     },
     {
       "id": 32002,
-      "content": "<|step|>",
       "single_word": false,
       "lstrip": false,
-      "rstrip": true,
       "normalized": false,
       "special": true
     },
     {
       "id": 32003,
-      "content": "<|function_output|>",
       "single_word": false,
       "lstrip": false,
-      "rstrip": true,
       "normalized": false,
       "special": true
     },
     {
       "id": 32004,
-      "content": "<|tag|>",
       "single_word": false,
       "lstrip": false,
-      "rstrip": true,
       "normalized": false,
       "special": true
     },
     {
       "id": 32005,
-      "content": "<|function_call|>",
       "single_word": false,
       "lstrip": false,
-      "rstrip": true,
       "normalized": false,
       "special": true
     },
@@ -89,7 +89,7 @@
       "content": "<|system|>",
       "single_word": false,
       "lstrip": false,
-      "rstrip": true,
       "normalized": false,
       "special": true
     },
@@ -98,25 +98,25 @@
       "content": "<|end|>",
       "single_word": false,
       "lstrip": false,
-      "rstrip": true,
       "normalized": false,
       "special": true
     },
     {
       "id": 32008,
-      "content": "<|raw|>",
       "single_word": false,
       "lstrip": false,
-      "rstrip": true,
       "normalized": false,
       "special": true
     },
     {
       "id": 32009,
-      "content": "<|continue|>",
       "single_word": false,
       "lstrip": false,
-      "rstrip": true,
       "normalized": false,
       "special": true
     },
@@ -125,250 +125,7 @@
       "content": "<|user|>",
       "single_word": false,
       "lstrip": false,
-      "rstrip": true,
-      "normalized": false,
-      "special": true
-    },
-    {
-      "id": 32011,
-      "content": "<|function_list|>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": true,
-      "normalized": false,
-      "special": true
-    },
-    {
-      "id": 32012,
-      "content": "<|calc|>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": true,
-      "normalized": false,
-      "special": true
-    },
-    {
-      "id": 32013,
-      "content": "<|code|>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": true,
-      "normalized": false,
-      "special": true
-    },
-    {
-      "id": 32014,
-      "content": "<|/code|>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": true,
-      "normalized": false,
-      "special": true
-    },
-    {
-      "id": 32015,
-      "content": "<|summary|>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": true,
-      "normalized": false,
-      "special": true
-    },
-    {
-      "id": 32016,
-      "content": "<|resource|>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": true,
-      "normalized": false,
-      "special": true
-    },
-    {
-      "id": 32017,
-      "content": "<|assistant_mask|>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": true,
-      "normalized": false,
-      "special": true
-    },
-    {
-      "id": 32018,
-      "content": "<|start|>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": true,
-      "normalized": false,
-      "special": true
-    },
-    {
-      "id": 32019,
-      "content": "<|message|>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": true,
-      "normalized": false,
-      "special": true
-    },
-    {
-      "id": 32020,
-      "content": "<|fim_prefix|>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": true,
-      "normalized": false,
-      "special": true
-    },
-    {
-      "id": 32021,
-      "content": "<|fim_middle|>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": true,
-      "normalized": false,
-      "special": true
-    },
-    {
-      "id": 32022,
-      "content": "<|fim_suffix|>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": true,
-      "normalized": false,
-      "special": true
-    },
-    {
-      "id": 32023,
-      "content": "<|meta_start|>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": true,
-      "normalized": false,
-      "special": true
-    },
-    {
-      "id": 32024,
-      "content": "<|ipynb_marker|>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": true,
-      "normalized": false,
-      "special": true
-    },
-    {
-      "id": 32025,
-      "content": "<|diff_marker|>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": true,
-      "normalized": false,
-      "special": true
-    },
-    {
-      "id": 32026,
-      "content": "<|ghissue|>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": true,
-      "normalized": false,
-      "special": true
-    },
-    {
-      "id": 32027,
-      "content": "<|ghreview|>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": true,
-      "normalized": false,
-      "special": true
-    },
-    {
-      "id": 32028,
-      "content": "<|disc_start|>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": true,
-      "normalized": false,
-      "special": true
-    },
-    {
-      "id": 32029,
-      "content": "<|disc_sep|>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": true,
-      "normalized": false,
-      "special": true
-    },
-    {
-      "id": 32030,
-      "content": "<|disc_thread|><|query|>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": true,
-      "normalized": false,
-      "special": true
-    },
-    {
-      "id": 32031,
-      "content": "<|/query|>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": true,
-      "normalized": false,
-      "special": true
-    },
-    {
-      "id": 32032,
-      "content": "<|data|>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": true,
-      "normalized": false,
-      "special": true
-    },
-    {
-      "id": 32033,
-      "content": "<|/data|>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": true,
-      "normalized": false,
-      "special": true
-    },
-    {
-      "id": 32034,
-      "content": "<|sys|>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": true,
-      "normalized": false,
-      "special": true
-    },
-    {
-      "id": 32035,
-      "content": "<|/sys|>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": true,
-      "normalized": false,
-      "special": true
-    },
-    {
-      "id": 32036,
-      "content": "<|inst|>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": true,
-      "normalized": false,
-      "special": true
-    },
-    {
-      "id": 32037,
-      "content": "<|/inst|>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": true,
       "normalized": false,
       "special": true
     }

       "content": "</s>",
       "single_word": false,
       "lstrip": false,
+      "rstrip": false,
       "normalized": false,
+      "special": true
     },
     {
       "id": 32000,
       "content": "<|assistant|>",
       "single_word": false,
       "lstrip": false,
+      "rstrip": false,
       "normalized": false,
       "special": true
     },
     {
       "id": 32002,
+      "content": "<|placeholder1|>",
       "single_word": false,
       "lstrip": false,
+      "rstrip": false,
       "normalized": false,
       "special": true
     },
     {
       "id": 32003,
+      "content": "<|placeholder2|>",
       "single_word": false,
       "lstrip": false,
+      "rstrip": false,
       "normalized": false,
       "special": true
     },
     {
       "id": 32004,
+      "content": "<|placeholder3|>",
       "single_word": false,
       "lstrip": false,
+      "rstrip": false,
       "normalized": false,
       "special": true
     },
     {
       "id": 32005,
+      "content": "<|placeholder4|>",
       "single_word": false,
       "lstrip": false,
+      "rstrip": false,
       "normalized": false,
       "special": true
     },
       "content": "<|system|>",
       "single_word": false,
       "lstrip": false,
+      "rstrip": false,
       "normalized": false,
       "special": true
     },
       "content": "<|end|>",
       "single_word": false,
       "lstrip": false,
+      "rstrip": false,
       "normalized": false,
       "special": true
     },
     {
       "id": 32008,
+      "content": "<|placeholder5|>",
       "single_word": false,
       "lstrip": false,
+      "rstrip": false,
       "normalized": false,
       "special": true
     },
     {
       "id": 32009,
+      "content": "<|placeholder6|>",
       "single_word": false,
       "lstrip": false,
+      "rstrip": false,
       "normalized": false,
       "special": true
     },
       "content": "<|user|>",
       "single_word": false,
       "lstrip": false,
+      "rstrip": false,
       "normalized": false,
       "special": true
     }

tokenizer_config.json CHANGED Viewed

@@ -22,9 +22,9 @@
       "content": "</s>",
       "lstrip": false,
       "normalized": false,
-      "rstrip": true,
       "single_word": false,
-      "special": false
     },
     "32000": {
       "content": "<|endoftext|>",
@@ -38,39 +38,39 @@
       "content": "<|assistant|>",
       "lstrip": false,
       "normalized": false,
-      "rstrip": true,
       "single_word": false,
       "special": true
     },
     "32002": {
-      "content": "<|step|>",
       "lstrip": false,
       "normalized": false,
-      "rstrip": true,
       "single_word": false,
       "special": true
     },
     "32003": {
-      "content": "<|function_output|>",
       "lstrip": false,
       "normalized": false,
-      "rstrip": true,
       "single_word": false,
       "special": true
     },
     "32004": {
-      "content": "<|tag|>",
       "lstrip": false,
       "normalized": false,
-      "rstrip": true,
       "single_word": false,
       "special": true
     },
     "32005": {
-      "content": "<|function_call|>",
       "lstrip": false,
       "normalized": false,
-      "rstrip": true,
       "single_word": false,
       "special": true
     },
@@ -78,7 +78,7 @@
       "content": "<|system|>",
       "lstrip": false,
       "normalized": false,
-      "rstrip": true,
       "single_word": false,
       "special": true
     },
@@ -86,23 +86,23 @@
       "content": "<|end|>",
       "lstrip": false,
       "normalized": false,
-      "rstrip": true,
       "single_word": false,
       "special": true
     },
     "32008": {
-      "content": "<|raw|>",
       "lstrip": false,
       "normalized": false,
-      "rstrip": true,
       "single_word": false,
       "special": true
     },
     "32009": {
-      "content": "<|continue|>",
       "lstrip": false,
       "normalized": false,
-      "rstrip": true,
       "single_word": false,
       "special": true
     },
@@ -110,232 +110,13 @@
       "content": "<|user|>",
       "lstrip": false,
       "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": true
-    },
-    "32011": {
-      "content": "<|function_list|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": true
-    },
-    "32012": {
-      "content": "<|calc|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": true
-    },
-    "32013": {
-      "content": "<|code|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": true
-    },
-    "32014": {
-      "content": "<|/code|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": true
-    },
-    "32015": {
-      "content": "<|summary|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": true
-    },
-    "32016": {
-      "content": "<|resource|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": true
-    },
-    "32017": {
-      "content": "<|assistant_mask|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": true
-    },
-    "32018": {
-      "content": "<|start|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": true
-    },
-    "32019": {
-      "content": "<|message|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": true
-    },
-    "32020": {
-      "content": "<|fim_prefix|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": true
-    },
-    "32021": {
-      "content": "<|fim_middle|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": true
-    },
-    "32022": {
-      "content": "<|fim_suffix|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": true
-    },
-    "32023": {
-      "content": "<|meta_start|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": true
-    },
-    "32024": {
-      "content": "<|ipynb_marker|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": true
-    },
-    "32025": {
-      "content": "<|diff_marker|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": true
-    },
-    "32026": {
-      "content": "<|ghissue|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": true
-    },
-    "32027": {
-      "content": "<|ghreview|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": true
-    },
-    "32028": {
-      "content": "<|disc_start|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": true
-    },
-    "32029": {
-      "content": "<|disc_sep|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": true
-    },
-    "32030": {
-      "content": "<|disc_thread|><|query|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": true
-    },
-    "32031": {
-      "content": "<|/query|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": true
-    },
-    "32032": {
-      "content": "<|data|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": true
-    },
-    "32033": {
-      "content": "<|/data|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": true
-    },
-    "32034": {
-      "content": "<|sys|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": true
-    },
-    "32035": {
-      "content": "<|/sys|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": true
-    },
-    "32036": {
-      "content": "<|inst|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": true
-    },
-    "32037": {
-      "content": "<|/inst|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": true,
       "single_word": false,
       "special": true
     }
   },
-  "additional_special_tokens": [
-    "<|/inst|>"
-  ],
   "bos_token": "<s>",
-  "chat_template": "{{ bos_token }}{% for message in messages %}{% if (message['role'] == 'system') %}{{'<|system|>' + '\n' + message['content'] + '<|end|>' + '\n'}}{% elif (message['role'] == 'user') %}{{'<|user|>' + '\n' + message['content'] + '<|end|>' + '\n' + '<|assistant|>' + '\n'}}{% elif message['role'] == 'assistant' %}{{message['content'] + '<|end|>' + '\n'}}{% endif %}{% endfor %}",
   "clean_up_tokenization_spaces": false,
   "eos_token": "<|endoftext|>",
   "legacy": false,

       "content": "</s>",
       "lstrip": false,
       "normalized": false,
+      "rstrip": false,
       "single_word": false,
+      "special": true
     },
     "32000": {
       "content": "<|endoftext|>",
       "content": "<|assistant|>",
       "lstrip": false,
       "normalized": false,
+      "rstrip": false,
       "single_word": false,
       "special": true
     },
     "32002": {
+      "content": "<|placeholder1|>",
       "lstrip": false,
       "normalized": false,
+      "rstrip": false,
       "single_word": false,
       "special": true
     },
     "32003": {
+      "content": "<|placeholder2|>",
       "lstrip": false,
       "normalized": false,
+      "rstrip": false,
       "single_word": false,
       "special": true
     },
     "32004": {
+      "content": "<|placeholder3|>",
       "lstrip": false,
       "normalized": false,
+      "rstrip": false,
       "single_word": false,
       "special": true
     },
     "32005": {
+      "content": "<|placeholder4|>",
       "lstrip": false,
       "normalized": false,
+      "rstrip": false,
       "single_word": false,
       "special": true
     },
       "content": "<|system|>",
       "lstrip": false,
       "normalized": false,
+      "rstrip": false,
       "single_word": false,
       "special": true
     },
       "content": "<|end|>",
       "lstrip": false,
       "normalized": false,
+      "rstrip": false,
       "single_word": false,
       "special": true
     },
     "32008": {
+      "content": "<|placeholder5|>",
       "lstrip": false,
       "normalized": false,
+      "rstrip": false,
       "single_word": false,
       "special": true
     },
     "32009": {
+      "content": "<|placeholder6|>",
       "lstrip": false,
       "normalized": false,
+      "rstrip": false,
       "single_word": false,
       "special": true
     },
       "content": "<|user|>",
       "lstrip": false,
       "normalized": false,
+      "rstrip": false,
       "single_word": false,
       "special": true
     }
   },
   "bos_token": "<s>",
+  "chat_template": "{{ bos_token }}{% for message in messages %}{% if (message['role'] == 'user') %}{{'<|user|>' + '\n' + message['content'] + '<|end|>' + '\n' + '<|assistant|>' + '\n'}}{% elif (message['role'] == 'assistant') %}{{message['content'] + '<|end|>' + '\n'}}{% endif %}{% endfor %}",
   "clean_up_tokenization_spaces": false,
   "eos_token": "<|endoftext|>",
   "legacy": false,