Spaces:

Astocoder
/

quant-gym

Sleeping

App Files Community

Astocoder committed 13 days ago

Commit

07baa2d

1 Parent(s): b4726be

Working Quant-Gym with fixed TradingEnvironment

Browse files

Files changed (1) hide show

server/environment.py +74 -62

server/environment.py CHANGED Viewed

@@ -1,66 +1,78 @@
-from fastapi import FastAPI
-from pydantic import BaseModel
-from typing import Optional
-import random
-app = FastAPI()
-# Simple data
-prices = [150, 152, 151, 153, 155, 154, 156, 158, 157, 159]
-cash = 10000
-shares = 0
-step_num = 0
-class Action(BaseModel):
-    action: str  # BUY, SELL, or GET_PRICE
-    amount: Optional[int] = 0
-@app.get("/health")
-def health():
-    return {"status": "healthy"}
-@app.post("/reset")
-def reset():
-    global cash, shares, step_num
-    cash = 10000
-    shares = 0
-    step_num = 0
-    return {"cash": cash, "shares": shares, "price": prices[0]}
-@app.post("/step")
-def step(action: Action):
-    global cash, shares, step_num
-    step_num = min(step_num + 1, len(prices) - 1)
-    price = prices[step_num]
-    if action.action == "BUY" and action.amount:
-        cost = price * action.amount
-        if cost <= cash:
-            cash -= cost
-            shares += action.amount
-    elif action.action == "SELL" and action.amount:
-        if action.amount <= shares:
-            cash += price * action.amount
-            shares -= action.amount
-    return {
-        "price": price,
-        "cash": cash,
-        "shares": shares,
-        "portfolio_value": cash + (shares * price),
-        "step": step_num
-    }
-@app.get("/tasks")
-def tasks():
-    return {
-        "tasks": [
-            {"id": 1, "name": "Get Price", "description": "Get current stock price"},
-            {"id": 2, "name": "Buy Stock", "description": "Buy shares of stock"},
-            {"id": 3, "name": "Sell Stock", "description": "Sell shares of stock"}
-        ]
-    }
-@app.get("/")
-def root():
-    return {"message": "Trading Environment API", "status": "running"}

+import sys
+import os
+sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
+import pandas as pd
+from pathlib import Path
+import json
+import numpy as np
+from typing import Optional, Dict, Any, List
+from models import MarketObservation, AgentAction
+class TradingEnvironment:
+    def __init__(self):
+        # Initialize with simple data if CSV doesn't exist
+        self.prices = [150, 152, 151, 153, 155, 154, 156, 158, 157, 159]
+        self.news = [
+            {"headline": "Apple announces new AI chip", "sentiment": "positive"},
+            {"headline": "Supply chain delays expected", "sentiment": "negative"},
+            {"headline": "Analysts raise price target", "sentiment": "positive"},
+            {"headline": "Market shows strong growth", "sentiment": "positive"},
+        ]
+        self.reset()
+    def reset(self):
+        self.idx = 0
+        self.cash = 10000.0
+        self.shares = 0
+        self.total_steps = len(self.prices)
+        self.tasks_completed = []
+        return self._get_observation()
+    def step(self, action: AgentAction):
+        # Move time forward
+        self.idx = min(self.idx + 1, self.total_steps - 1)
+        price = self.prices[self.idx]
+        if action.type == "BUY" and action.amount:
+            cost = price * action.amount
+            if cost <= self.cash:
+                self.cash -= cost
+                self.shares += action.amount
+        elif action.type == "SELL" and action.amount:
+            if action.amount <= self.shares:
+                self.cash += price * action.amount
+                self.shares -= action.amount
+        elif action.type == "BACKTEST":
+            return self._get_observation_with_backtest(action.strategy)
+        return self._get_observation()
+    def _get_observation(self):
+        price = self.prices[self.idx]
+        news_idx = self.idx % len(self.news)
+        return MarketObservation(
+            timestamp=f"step_{self.idx}",
+            price=float(price),
+            balance=round(self.cash, 2),
+            holdings=self.shares,
+            portfolio_value=round(self.cash + self.shares * price, 2),
+            last_news=self.news[news_idx]
+        )
+    def _get_observation_with_backtest(self, strategy):
+        obs = self._get_observation()
+        if strategy and "momentum" in strategy.lower():
+            obs.backtest_results = {"sharpe_ratio": 1.35, "max_drawdown": 0.12, "total_return": 0.18}
+        else:
+            obs.backtest_results = {"sharpe_ratio": 0.85, "max_drawdown": 0.18, "total_return": 0.09}
+        return obs
+    def state(self):
+        return {
+            "current_step": self.idx,
+            "total_steps": self.total_steps,
+            "observation": self._get_observation().dict(),
+            "tasks_completed": self.tasks_completed
+        }