chipling committed on
Commit
f6ab7af
·
verified ·
1 Parent(s): 8f054a9

Update models/text/deepinfra/main.py

Browse files
Files changed (1) hide show
  1. models/text/deepinfra/main.py +77 -51
models/text/deepinfra/main.py CHANGED
@@ -4,7 +4,6 @@ import asyncio
4
  import json
5
 
6
  class OFFDeepInfraAPI:
7
-
8
  headers = {
9
  'Accept-Language': 'en-US,en;q=0.9,ja;q=0.8',
10
  'Connection': 'keep-alive',
@@ -26,70 +25,97 @@ class OFFDeepInfraAPI:
26
  self.base_url = "https://api.deepinfra.com/v1/openai/chat/completions"
27
 
28
  def get_model_list(self):
29
- models = ['meta-llama/Llama-3.3-70B-Instruct-Turbo', 'deepseek-ai/DeepSeek-R1-Turbo', 'deepseek-ai/DeepSeek-R1-Distill-Llama-70B', 'deepseek-ai/DeepSeek-R1-Distill-Qwen-32B']
30
- return models
31
-
 
 
 
32
 
33
  async def generate(self, json_data: dict):
 
34
  json_data['stream_options'] = {
35
  'include_usage': True,
36
  'continuous_usage_stats': True,
37
  }
 
38
  chunk_id = "chipling-deepinfraoff-" + "".join(random.choices("0123456789abcdef", k=32))
39
  created = int(asyncio.get_event_loop().time())
40
- total_tokens = 0
 
41
 
42
  try:
43
  async with httpx.AsyncClient(timeout=None) as client:
44
  async with client.stream(
45
  "POST",
46
- "https://api.deepinfra.com/v1/openai/chat/completions",
47
  headers=OFFDeepInfraAPI.headers,
48
  json=json_data
49
- ) as request_ctx:
50
- print(request_ctx.status_code)
51
- if request_ctx.status_code == 200:
52
- async for line in request_ctx.aiter_lines():
53
- if line:
54
- if line.startswith('0:'):
55
- # Clean up the text and properly escape JSON characters
56
- text = line[2:].strip()
57
- if text.startswith('"') and text.endswith('"'):
58
- text = text[1:-1]
59
- text = text.replace('\\n', '\n').replace('\\', '')
60
-
61
- response = {
62
- "id": chunk_id,
63
- "object": "chat.completion.chunk",
64
- "created": created,
65
- "model": json_data.get("model", "deepseek-r1-distill-llama-70b"),
66
- "choices": [{
67
- "index": 0,
68
- "text": text,
69
- "logprobs": None,
70
- "finish_reason": None
71
- }],
72
- "usage": None
73
- }
74
- yield f"data: {json.dumps(response)}\n\n"
75
- total_tokens += 1
76
- elif line.startswith('d:'):
77
- final = {
78
- "id": chunk_id,
79
- "object": "chat.completion.chunk",
80
- "created": created,
81
- "model": json_data.get("model", "deepseek-r1-distill-llama-70b"),
82
- "choices": [],
83
- "usage": {
84
- "prompt_tokens": len(messages),
85
- "completion_tokens": total_tokens,
86
- "total_tokens": len(messages) + total_tokens
87
- }
88
- }
89
- yield f"data: {json.dumps(final)}\n\n"
90
- yield "data: [DONE]\n\n"
91
  return
92
- else:
93
- yield f"data: [Unexpected status code: {request_ctx.status_code}]\n\n"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
94
  except Exception as e:
95
- yield f"data: [Connection error: {str(e)}]\n\n"
 
4
  import json
5
 
6
  class OFFDeepInfraAPI:
 
7
  headers = {
8
  'Accept-Language': 'en-US,en;q=0.9,ja;q=0.8',
9
  'Connection': 'keep-alive',
 
25
  self.base_url = "https://api.deepinfra.com/v1/openai/chat/completions"
26
 
27
  def get_model_list(self):
28
+ return [
29
+ 'meta-llama/Llama-3.3-70B-Instruct-Turbo',
30
+ 'deepseek-ai/DeepSeek-R1-Turbo',
31
+ 'deepseek-ai/DeepSeek-R1-Distill-Llama-70B',
32
+ 'deepseek-ai/DeepSeek-R1-Distill-Qwen-32B'
33
+ ]
34
 
35
  async def generate(self, json_data: dict):
36
+ json_data['stream'] = True # Ensure stream is enabled
37
  json_data['stream_options'] = {
38
  'include_usage': True,
39
  'continuous_usage_stats': True,
40
  }
41
+
42
  chunk_id = "chipling-deepinfraoff-" + "".join(random.choices("0123456789abcdef", k=32))
43
  created = int(asyncio.get_event_loop().time())
44
+ total_completion_tokens = 0
45
+ model_name = json_data.get("model", "unknown")
46
 
47
  try:
48
  async with httpx.AsyncClient(timeout=None) as client:
49
  async with client.stream(
50
  "POST",
51
+ self.base_url,
52
  headers=OFFDeepInfraAPI.headers,
53
  json=json_data
54
+ ) as response:
55
+ if response.status_code != 200:
56
+ yield f"data: [Unexpected status code: {response.status_code}]\n\n"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
57
  return
58
+
59
+ async for line in response.aiter_lines():
60
+ if not line or not line.startswith("data:"):
61
+ continue
62
+
63
+ data_str = line.removeprefix("data:").strip()
64
+ if data_str == "[DONE]":
65
+ yield "data: [DONE]\n\n"
66
+ return
67
+
68
+ try:
69
+ data = json.loads(data_str)
70
+ delta = data["choices"][0].get("delta", {})
71
+ content = delta.get("content", "")
72
+ finish_reason = data["choices"][0].get("finish_reason", None)
73
+
74
+ if content or finish_reason:
75
+ transformed = {
76
+ "id": chunk_id,
77
+ "object": "chat.completion.chunk",
78
+ "created": created,
79
+ "choices": [{
80
+ "index": 0,
81
+ "text": content,
82
+ "logprobs": None,
83
+ "finish_reason": finish_reason,
84
+ "delta": {
85
+ "token_id": None,
86
+ "role": delta.get("role", "assistant"),
87
+ "content": content,
88
+ "tool_calls": delta.get("tool_calls"),
89
+ }
90
+ }],
91
+ "model": model_name,
92
+ "usage": None
93
+ }
94
+ yield f"data: {json.dumps(transformed)}\n\n"
95
+
96
+ # Update usage stats
97
+ usage = data.get("usage")
98
+ if usage:
99
+ total_completion_tokens = usage.get("completion_tokens", total_completion_tokens)
100
+
101
+ except json.JSONDecodeError:
102
+ continue
103
+
104
+ # Final usage chunk
105
+ final = {
106
+ "id": chunk_id,
107
+ "object": "chat.completion.chunk",
108
+ "created": created,
109
+ "choices": [],
110
+ "model": model_name,
111
+ "usage": {
112
+ "prompt_tokens": 0,
113
+ "completion_tokens": total_completion_tokens,
114
+ "total_tokens": total_completion_tokens
115
+ }
116
+ }
117
+ yield f"data: {json.dumps(final)}\n\n"
118
+ yield "data: [DONE]\n\n"
119
+
120
  except Exception as e:
121
+ yield f"data: [Connection error: {str(e)}]\n\n"