:gem: [Feature] New model supported: command-r-plus (CohereForAI/c4ai-command-r-plus)
- constants/models.py +11 -9
- messagers/message_composer.py +8 -3
constants/models.py CHANGED
@@ -4,9 +4,11 @@ MODEL_MAP = {
     "mistral-7b": "mistralai/Mistral-7B-Instruct-v0.2",
     "openchat-3.5": "openchat/openchat-3.5-0106",
     "gemma-7b": "google/gemma-7b-it",
+    "command-r-plus": "CohereForAI/c4ai-command-r-plus",
     "default": "mistralai/Mixtral-8x7B-Instruct-v0.1",
 }
 
+AVAILABLE_MODELS = list(MODEL_MAP.keys())
 
 STOP_SEQUENCES_MAP = {
     "mixtral-8x7b": "</s>",
@@ -14,6 +16,7 @@ STOP_SEQUENCES_MAP = {
     "mistral-7b": "</s>",
     "openchat-3.5": "<|end_of_turn|>",
     "gemma-7b": "<eos>",
+    "command-r-plus": "<|END_OF_TURN_TOKEN|>",
 }
 
 TOKEN_LIMIT_MAP = {
@@ -23,20 +26,12 @@ TOKEN_LIMIT_MAP = {
     "openchat-3.5": 8192,
     "gemma-7b": 8192,
     "gpt-3.5-turbo": 8192,
+    "command-r-plus": 32768,
 }
 
 TOKEN_RESERVED = 20
 
 
-AVAILABLE_MODELS = [
-    "mixtral-8x7b",
-    "nous-mixtral-8x7b",
-    "mistral-7b",
-    "openchat-3.5",
-    "gemma-7b",
-    "gpt-3.5-turbo",
-]
-
 # https://platform.openai.com/docs/api-reference/models/list
 AVAILABLE_MODELS_DICTS = [
     {
@@ -74,6 +69,13 @@ AVAILABLE_MODELS_DICTS = [
         "created": 1700000000,
         "owned_by": "Google",
     },
+    {
+        "id": "command-r-plus",
+        "description": "[CohereForAI/c4ai-command-r-plus]: https://huggingface.co/CohereForAI/c4ai-command-r-plus",
+        "object": "model",
+        "created": 1700000000,
+        "owned_by": "CohereForAI",
+    },
     {
         "id": "gpt-3.5-turbo",
         "description": "[openai/gpt-3.5-turbo]: https://platform.openai.com/docs/models/gpt-3-5-turbo",
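Taken together, the maps above fully describe a model: HF repo id, stop sequence, and context budget. Deriving AVAILABLE_MODELS from MODEL_MAP.keys() keeps a single source of truth, so adding a model is one dict entry instead of two parallel lists. A minimal sketch of how a caller might resolve these settings for the new model (resolve_model is a hypothetical helper, not part of this commit; the 4096 fallback is an assumption):

# A minimal sketch (not part of this commit) of how the maps above might
# be consumed; resolve_model() is a hypothetical helper name.
from constants.models import (
    MODEL_MAP,
    STOP_SEQUENCES_MAP,
    TOKEN_LIMIT_MAP,
    TOKEN_RESERVED,
)

def resolve_model(name: str) -> tuple:
    """Resolve a short model id to (HF repo, stop sequence, usable token budget)."""
    fullname = MODEL_MAP.get(name, MODEL_MAP["default"])
    stop = STOP_SEQUENCES_MAP.get(name)  # None for models with no explicit stop token
    # The 4096 fallback is an assumption; TOKEN_RESERVED leaves headroom for generation.
    budget = TOKEN_LIMIT_MAP.get(name, 4096) - TOKEN_RESERVED
    return fullname, stop, budget

print(resolve_model("command-r-plus"))
# -> ('CohereForAI/c4ai-command-r-plus', '<|END_OF_TURN_TOKEN|>', 32748)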
messagers/message_composer.py CHANGED
@@ -151,11 +151,15 @@ class MessageComposer:
         # https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO#prompt-format
         # https://huggingface.co/openchat/openchat-3.5-0106
         # elif self.model in ["openchat-3.5", "nous-mixtral-8x7b"]:
-        else:
-            tokenizer = AutoTokenizer.from_pretrained(self.model_fullname)
+        elif self.model in ["openchat-3.5", "command-r-plus"]:
+            tokenizer = AutoTokenizer.from_pretrained(self.model_fullname)
             self.merged_str = tokenizer.apply_chat_template(
                 messages, tokenize=False, add_generation_prompt=True
             )
+        else:
+            self.merged_str = "\n\n".join(
+                [f"{message['role']}: {message['content']}" for message in messages]
+            )
 
         return self.merged_str
 
@@ -164,7 +168,8 @@ if __name__ == "__main__":
     # model = "mixtral-8x7b"
     # model = "nous-mixtral-8x7b"
    # model = "gemma-7b"
-    model = "openchat-3.5"
+    # model = "openchat-3.5"
+    model = "command-r-plus"
    composer = MessageComposer(model)
    messages = [
        {
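The new elif branch delegates prompt formatting to the tokenizer's bundled chat template rather than hand-rolling the Cohere turn tokens, with a plain role-prefixed join as the fallback for models without one. A standalone sketch of that path, assuming a recent transformers release and access to the gated CohereForAI/c4ai-command-r-plus repo:

# Standalone sketch of the chat-template path added above. Assumes a recent
# `transformers` and access to the gated CohereForAI/c4ai-command-r-plus repo
# (e.g. after `huggingface-cli login`).
from transformers import AutoTokenizer

messages = [
    {"role": "system", "content": "You are a helpful assistant."},
    {"role": "user", "content": "Hello, who are you?"},
]

tokenizer = AutoTokenizer.from_pretrained("CohereForAI/c4ai-command-r-plus")
merged_str = tokenizer.apply_chat_template(
    messages, tokenize=False, add_generation_prompt=True
)
# The rendered prompt ends with the assistant turn-start tokens, and generation
# stops at "<|END_OF_TURN_TOKEN|>" per STOP_SEQUENCES_MAP in constants/models.py.
print(merged_str)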
|