fd5e4dca535e8d001f91b5baf1336c188739846ec84c0d6958e2e84aa51d5bfb

Browse files

Files changed (6)

README.md +7 -3
config.json +1 -55
model-00016-of-00016.safetensors +3 -0
model.safetensors.index.json +0 -0
tokenizer.json +4 -4
tokenizer_config.json +14 -5

README.md CHANGED Viewed

@@ -1,15 +1,19 @@
 ---
 license: apache-2.0
 tags:
 - mlx
 ---
 # mlx-community/Mixtral-8x22B-Instruct-v0.1-4bit
-This model was converted to MLX format from [`mistralai/Mixtral-8x22B-Instruct-v0.1`]() using mlx-lm version **0.9.0**.
-Model added by [Prince Canuma](https://twitter.com/Prince_Canuma).
-Refer to the [original model card](https://huggingface.co/mistralai/Mixtral-8x22B-Instruct-v0.1) for more details on the model.
 ## Use with mlx
 ```bash

 ---
+language:
+- en
+- es
+- it
+- de
+- fr
 license: apache-2.0
 tags:
 - mlx
 ---
 # mlx-community/Mixtral-8x22B-Instruct-v0.1-4bit
+The Model [mlx-community/Mixtral-8x22B-Instruct-v0.1-4bit](https://huggingface.co/mlx-community/Mixtral-8x22B-Instruct-v0.1-4bit) was converted to MLX format from [mistralai/Mixtral-8x22B-Instruct-v0.1](https://huggingface.co/mistralai/Mixtral-8x22B-Instruct-v0.1) using mlx-lm version **0.14.0**.
 ## Use with mlx
 ```bash

config.json CHANGED Viewed

@@ -1,87 +1,33 @@
 {
-    "add_cross_attention": false,
     "architectures": [
         "MixtralForCausalLM"
     ],
     "attention_dropout": 0.0,
-    "bad_words_ids": null,
-    "begin_suppress_tokens": null,
     "bos_token_id": 1,
-    "chunk_size_feed_forward": 0,
-    "cross_attention_hidden_size": null,
-    "decoder_start_token_id": null,
-    "diversity_penalty": 0.0,
-    "do_sample": false,
-    "early_stopping": false,
-    "encoder_no_repeat_ngram_size": 0,
     "eos_token_id": 2,
-    "exponential_decay_length_penalty": null,
-    "finetuning_task": null,
-    "forced_bos_token_id": null,
-    "forced_eos_token_id": null,
     "hidden_act": "silu",
     "hidden_size": 6144,
-    "id2label": {
-        "0": "LABEL_0",
-        "1": "LABEL_1"
-    },
     "initializer_range": 0.02,
     "intermediate_size": 16384,
-    "is_decoder": false,
-    "is_encoder_decoder": false,
-    "label2id": {
-        "LABEL_0": 0,
-        "LABEL_1": 1
-    },
-    "length_penalty": 1.0,
-    "max_length": 20,
     "max_position_embeddings": 65536,
-    "min_length": 0,
     "model_type": "mixtral",
-    "no_repeat_ngram_size": 0,
     "num_attention_heads": 48,
-    "num_beam_groups": 1,
-    "num_beams": 1,
     "num_experts_per_tok": 2,
     "num_hidden_layers": 56,
     "num_key_value_heads": 8,
     "num_local_experts": 8,
-    "num_return_sequences": 1,
-    "output_attentions": false,
-    "output_hidden_states": false,
     "output_router_logits": false,
-    "output_scores": false,
-    "pad_token_id": null,
-    "prefix": null,
-    "problem_type": null,
-    "pruned_heads": {},
     "quantization": {
         "group_size": 64,
         "bits": 4
     },
-    "remove_invalid_values": false,
-    "repetition_penalty": 1.0,
-    "return_dict": true,
-    "return_dict_in_generate": false,
     "rms_norm_eps": 1e-05,
     "rope_theta": 1000000.0,
     "router_aux_loss_coef": 0.001,
-    "sep_token_id": null,
     "sliding_window": null,
-    "suppress_tokens": null,
-    "task_specific_params": null,
-    "temperature": 1.0,
-    "tf_legacy_loss": false,
-    "tie_encoder_decoder": false,
     "tie_word_embeddings": false,
-    "tokenizer_class": null,
-    "top_k": 50,
-    "top_p": 1.0,
     "torch_dtype": "bfloat16",
-    "torchscript": false,
-    "transformers_version": "4.39.3",
-    "typical_p": 1.0,
-    "use_bfloat16": false,
     "use_cache": true,
     "vocab_size": 32768
 }

 {
     "architectures": [
         "MixtralForCausalLM"
     ],
     "attention_dropout": 0.0,
     "bos_token_id": 1,
     "eos_token_id": 2,
     "hidden_act": "silu",
     "hidden_size": 6144,
     "initializer_range": 0.02,
     "intermediate_size": 16384,
     "max_position_embeddings": 65536,
     "model_type": "mixtral",
     "num_attention_heads": 48,
     "num_experts_per_tok": 2,
     "num_hidden_layers": 56,
     "num_key_value_heads": 8,
     "num_local_experts": 8,
     "output_router_logits": false,
     "quantization": {
         "group_size": 64,
         "bits": 4
     },
     "rms_norm_eps": 1e-05,
     "rope_theta": 1000000.0,
     "router_aux_loss_coef": 0.001,
     "sliding_window": null,
     "tie_word_embeddings": false,
     "torch_dtype": "bfloat16",
+    "transformers_version": "4.38.0",
     "use_cache": true,
     "vocab_size": 32768
 }

model-00016-of-00016.safetensors ADDED Viewed

@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cef97915a74a5e172c21766b15e8ae734fdca4368b07bcd08b4455cce4f06357
+size 1472239423

model.safetensors.index.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

tokenizer.json CHANGED Viewed

@@ -76,8 +76,8 @@
       "special": true
     },
     {
-      "id": 9,
-      "content": "[/TOOL_RESULTS]",
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
@@ -85,8 +85,8 @@
       "special": true
     },
     {
-      "id": 32768,
-      "content": "[TOOL_RESULT]",
       "single_word": false,
       "lstrip": false,
       "rstrip": false,

       "special": true
     },
     {
+      "id": 8,
+      "content": "[TOOL_RESULTS]",
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
       "special": true
     },
     {
+      "id": 9,
+      "content": "[/TOOL_RESULTS]",
       "single_word": false,
       "lstrip": false,
       "rstrip": false,

tokenizer_config.json CHANGED Viewed

@@ -66,16 +66,16 @@
       "single_word": false,
       "special": true
     },
-    "9": {
-      "content": "[/TOOL_RESULTS]",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": false,
       "special": true
     },
-    "32768": {
-      "content": "[TOOL_RESULT]",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
@@ -85,7 +85,16 @@
   },
   "additional_special_tokens": [],
   "bos_token": "<s>",
-  "chat_template": "{{bos_token}}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if message['role'] == 'user' %}{{ ' [INST] ' + message['content'] + ' [/INST]' }}{% elif message['role'] == 'assistant' %}{{ ' ' + message['content'] + ' ' + eos_token}}{% else %}{{ raise_exception('Only user and assistant roles are supported!') }}{% endif %}{% endfor %}",
   "clean_up_tokenization_spaces": false,
   "eos_token": "</s>",
   "legacy": true,

       "single_word": false,
       "special": true
     },
+    "8": {
+      "content": "[TOOL_RESULTS]",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": false,
       "special": true
     },
+    "9": {
+      "content": "[/TOOL_RESULTS]",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
   },
   "additional_special_tokens": [],
   "bos_token": "<s>",
+  "chat_template": [
+    {
+      "name": "default",
+      "template": "{{bos_token}}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if message['role'] == 'user' %}{{ ' [INST] ' + message['content'] + ' [/INST]' }}{% elif message['role'] == 'assistant' %}{{ ' ' + message['content'] + ' ' + eos_token}}{% else %}{{ raise_exception('Only user and assistant roles are supported!') }}{% endif %}{% endfor %}"
+    },
+    {
+      "name": "tool_use",
+      "template": "{{bos_token}}{% set user_messages = messages | selectattr('role', 'equalto', 'user') | list %}{% for message in messages %}{% if message['role'] == 'user' %}{% if message == user_messages[-1] %}{% if tools %}{{'[AVAILABLE_TOOLS]'+ tools|string + '[/AVAILABLE_TOOLS]'}}{% endif %}{{ '[INST]' + message['content'] + '[/INST]' }}{% else %}{{ '[INST]' + message['content'] + '[/INST]' }}{% endif %}{% elif message['role'] == 'assistant' %}{{ ' ' + message['content'] + ' ' + eos_token}}{% elif message['role'] == 'tool_results' %}{{'[TOOL_RESULTS]' + message['content']|string + '[/TOOL_RESULTS]'}}{% elif message['role'] == 'tool_calls' %}{{'[TOOL_CALLS]' + message['content']|string + eos_token}}{% endif %}{% endfor %}"
+    }
+  ],
   "clean_up_tokenization_spaces": false,
   "eos_token": "</s>",
   "legacy": true,