Kang Suhyun committed on
Commit
2667b32
1 Parent(s): 5cbd838

[#115|#116] Reintroduce EEVE (#121)

Browse files

* [#115|#116] Reintroduce EEVE

* _get_completion_kwargs

* remove print

* fix

* inline

Files changed (1) hide show
  1. model.py +40 -8
model.py CHANGED
@@ -3,6 +3,7 @@ This module contains functions to interact with the models.
3
  """
4
 
5
  import json
 
6
  from typing import List
7
 
8
  import litellm
@@ -48,15 +49,15 @@ Output following this JSON format:
48
  "role": "user",
49
  "content": prompt
50
  }]
 
51
  try:
52
- response = litellm.completion(
53
- model=self.provider + "/" + self.name if self.provider else self.name,
54
- api_key=self.api_key,
55
- api_base=self.api_base,
56
- messages=messages,
57
- max_tokens=max_tokens,
58
- # Ref: https://litellm.vercel.app/docs/completion/input#optional-fields # pylint: disable=line-too-long
59
- response_format={"type": "json_object"})
60
 
61
  json_response = response.choices[0].message.content
62
  parsed_json = json.loads(json_response)
@@ -67,6 +68,14 @@ Output following this JSON format:
67
  except json.JSONDecodeError as e:
68
  raise RuntimeError(f"Failed to get JSON response: {e}") from e
69
 
 
 
 
 
 
 
 
 
70
 
71
  class AnthropicModel(Model):
72
 
@@ -109,6 +118,25 @@ Text:
109
  return result.removesuffix(suffix).strip()
110
 
111
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
112
  supported_models: List[Model] = [
113
  Model("gpt-4o-2024-05-13"),
114
  Model("gpt-4-turbo-2024-04-09"),
@@ -121,6 +149,10 @@ supported_models: List[Model] = [
121
  Model("mistral-large-2402", provider="mistral"),
122
  Model("llama3-8b-8192", provider="groq"),
123
  Model("llama3-70b-8192", provider="groq"),
 
 
 
 
124
  ]
125
 
126
 
 
3
  """
4
 
5
  import json
6
+ import os
7
  from typing import List
8
 
9
  import litellm
 
49
  "role": "user",
50
  "content": prompt
51
  }]
52
+
53
  try:
54
+ response = litellm.completion(model=self.provider + "/" +
55
+ self.name if self.provider else self.name,
56
+ api_key=self.api_key,
57
+ api_base=self.api_base,
58
+ messages=messages,
59
+ max_tokens=max_tokens,
60
+ **self._get_completion_kwargs())
 
61
 
62
  json_response = response.choices[0].message.content
63
  parsed_json = json.loads(json_response)
 
68
  except json.JSONDecodeError as e:
69
  raise RuntimeError(f"Failed to get JSON response: {e}") from e
70
 
71
+ def _get_completion_kwargs(self):
72
+ return {
73
+ # Ref: https://litellm.vercel.app/docs/completion/input#optional-fields # pylint: disable=line-too-long
74
+ "response_format": {
75
+ "type": "json_object"
76
+ }
77
+ }
78
+
79
 
80
  class AnthropicModel(Model):
81
 
 
118
  return result.removesuffix(suffix).strip()
119
 
120
 
121
+ class EeveModel(Model):
122
+
123
+ def _get_completion_kwargs(self):
124
+ json_template = {
125
+ "type": "object",
126
+ "properties": {
127
+ "result": {
128
+ "type": "string"
129
+ }
130
+ }
131
+ }
132
+ return {
133
+ "extra_body": {
134
+ "guided_json": json.dumps(json_template),
135
+ "guided_decoding_backend": "lm-format-enforcer"
136
+ }
137
+ }
138
+
139
+
140
  supported_models: List[Model] = [
141
  Model("gpt-4o-2024-05-13"),
142
  Model("gpt-4-turbo-2024-04-09"),
 
149
  Model("mistral-large-2402", provider="mistral"),
150
  Model("llama3-8b-8192", provider="groq"),
151
  Model("llama3-70b-8192", provider="groq"),
152
+ EeveModel("yanolja/EEVE-Korean-Instruct-10.8B-v1.0",
153
+ provider="openai",
154
+ api_base=os.getenv("EEVE_API_BASE"),
155
+ api_key=os.getenv("EEVE_API_KEY")),
156
  ]
157
 
158