Spaces:

hiitsesh
/

openenv-hackathon

Running

App Files Community

hiitsesh committed 14 days ago

Commit

0287ccf

1 Parent(s): 36ac8be

fix: refactor OpenAI client initialization and update API request handling

Browse files

Files changed (1) hide show

inference.py +14 -21

inference.py CHANGED Viewed

@@ -2,26 +2,13 @@ import os
 import json
 import re
 import requests
-from openai import OpenAI
 API_BASE_URL = os.getenv("API_BASE_URL", "https://api.openai.com/v1")
-API_KEY = os.getenv("HF_TOKEN") or os.getenv("API_KEY")
 MODEL_NAME = os.getenv("MODEL_NAME", "gpt-3.5-turbo")
 ENV_BASE_URL = "http://localhost:7860"
-# Initialize OpenAI client
-client = None
-if API_BASE_URL and API_KEY:
-    client = OpenAI(
-        base_url=API_BASE_URL,
-        api_key=API_KEY
-    )
-elif API_KEY:
-    client = OpenAI(api_key=API_KEY)
-else:
-    client = OpenAI(api_key="dummy_key")
 SYSTEM_PROMPT = """You are an elite AI agent controlling an industrial reverse-osmosis desalination plant.
 Your objective: Manage the trade-offs of fresh water production against energy costs and membrane degradation, while ensuring water_salinity NEVER exceeds 450 PPM and reservoir NEVER dries out.
 IMPORTANT: You MUST respond ONLY with valid JSON holding exactly two keys: "production_rate" (float 0.0 to 50.0) and "run_cleaning" (boolean).
@@ -134,16 +121,22 @@ def evaluate_baseline(task_id):
         error_msg = "null"
         try:
-            response = client.chat.completions.create(
-                model=MODEL_NAME,
-                messages=[
                     {"role": "system", "content": SYSTEM_PROMPT},
                     {"role": "user", "content": prompt}
                 ],
-                temperature=0.0,
-                max_tokens=150
-            )
-            llm_content = response.choices[0].message.content
             action = parse_action(llm_content)
         except Exception as e:
             error_msg = f"'{str(e)}'"

 import json
 import re
 import requests
 API_BASE_URL = os.getenv("API_BASE_URL", "https://api.openai.com/v1")
+API_KEY = os.getenv("HF_TOKEN") or os.getenv("API_KEY") or "dummy_key"
 MODEL_NAME = os.getenv("MODEL_NAME", "gpt-3.5-turbo")
 ENV_BASE_URL = "http://localhost:7860"
 SYSTEM_PROMPT = """You are an elite AI agent controlling an industrial reverse-osmosis desalination plant.
 Your objective: Manage the trade-offs of fresh water production against energy costs and membrane degradation, while ensuring water_salinity NEVER exceeds 450 PPM and reservoir NEVER dries out.
 IMPORTANT: You MUST respond ONLY with valid JSON holding exactly two keys: "production_rate" (float 0.0 to 50.0) and "run_cleaning" (boolean).
         error_msg = "null"
         try:
+            headers = {
+                "Authorization": f"Bearer {API_KEY}",
+                "Content-Type": "application/json"
+            }
+            payload = {
+                "model": MODEL_NAME,
+                "messages": [
                     {"role": "system", "content": SYSTEM_PROMPT},
                     {"role": "user", "content": prompt}
                 ],
+                "temperature": 0.0,
+                "max_tokens": 150
+            }
+            response = requests.post(f"{API_BASE_URL.rstrip('/')}/chat/completions", headers=headers, json=payload, timeout=30)
+            response.raise_for_status()
+            llm_content = response.json()["choices"][0]["message"]["content"]
             action = parse_action(llm_content)
         except Exception as e:
             error_msg = f"'{str(e)}'"