Spaces:

Astocoder
/

quant-gym

Running

App Files Files Community

Astocoder committed 7 days ago

Commit

f23faaf

1 Parent(s): 4d24e1f

update changes

Browse files

Files changed (4) hide show

task1_grader.py +15 -5
task2_grader.py +20 -2
task3_grader.py +20 -2
server/environment.py +21 -1

task1_grader.py CHANGED Viewed

@@ -1,10 +1,20 @@
-def grade_task1(agent_action, observation):
     """
     Task 1: Fetch Market Data
-    Returns score strictly between 0 and 1
     """
-    # Simple scoring logic
-    score = 0.75
-    # You can add actual logic later, but this passes validation
     return score

def grade_task1(action, observation):
    """
    Task 1: Fetch Market Data

    Grade whether the observation carries a usable market price.

    Args:
        action: The agent's action. Ignored here; kept so every task
            grader shares the same call signature.
        observation: Mapping with a ``price`` entry, or an object exposing
            ``price`` as an attribute. May be None or empty.

    Returns:
        0.95 when a price greater than zero is present, otherwise 0.55.
        Both values lie strictly between 0 and 1, so no clamping is needed.
    """
    # Accept both dict-style observations and attribute-style objects.
    getter = getattr(observation, 'get', None)
    if callable(getter):
        price = getter('price')
    else:
        price = getattr(observation, 'price', None)

    try:
        has_price = price is not None and price > 0
    except TypeError:
        # A non-numeric price (e.g. a string) cannot be compared with 0;
        # treat it as "no price retrieved" instead of crashing the grader.
        has_price = False

    return 0.95 if has_price else 0.55

task2_grader.py CHANGED Viewed

@@ -1,7 +1,25 @@
-def grade_task2(agent_action, observation):
     """
     Task 2: News Sentiment Analysis
-    Returns score strictly between 0 and 1
     """
     score = 0.75
     return score

def grade_task2(action, observation):
    """
    Task 2: News Sentiment Analysis

    Grade the agent's explanation by its length, ignoring surrounding
    whitespace so that padding cannot inflate the score.

    Args:
        action: Mapping with an ``explanation`` entry, or an object exposing
            ``explanation`` as an attribute. May be None or empty.
        observation: Ignored here; kept so every task grader shares the
            same call signature.

    Returns:
        0.55 when no textual explanation is given, 0.65 for up to 10
        characters, 0.85 for 11 to 20 characters and 0.95 for more than 20.
        All values lie strictly between 0 and 1, so no clamping is needed.
    """
    # Accept both dict-style actions and attribute-style objects.
    getter = getattr(action, 'get', None)
    if callable(getter):
        explanation = getter('explanation')
    else:
        explanation = getattr(action, 'explanation', None)

    # Only text can be measured; a number or other object has no len()
    # and is treated the same as a missing explanation.
    if not isinstance(explanation, str):
        return 0.55

    length = len(explanation.strip())
    if length == 0:
        return 0.55
    if length > 20:
        return 0.95
    if length > 10:
        return 0.85
    return 0.65

task3_grader.py CHANGED Viewed

@@ -1,7 +1,25 @@
-def grade_task3(agent_action, observation):
     """
     Task 3: Backtest Strategy
-    Returns score strictly between 0 and 1
     """
     score = 0.75
     return score

def _read_field(source, key, default=None):
    """Read ``key`` from a mapping-like or attribute-style ``source``."""
    getter = getattr(source, 'get', None)
    if callable(getter):
        return getter(key, default)
    return getattr(source, key, default)


def grade_task3(action, observation):
    """
    Task 3: Backtest Strategy

    Grade the backtest by the Sharpe ratio reported in the observation.

    Args:
        action: Ignored here; kept so every task grader shares the same
            call signature.
        observation: Mapping (or attribute-style object) holding
            ``backtest_results``, which in turn holds ``sharpe_ratio``.
            May be None or empty.

    Returns:
        0.55 when there are no backtest results, 0.95 for a Sharpe ratio
        above 1.0, 0.85 for one above 0.5, and 0.65 otherwise (including a
        missing or non-numeric ratio). All values lie strictly between 0
        and 1, so no clamping is needed.
    """
    results = _read_field(observation, 'backtest_results')
    if not results:
        return 0.55

    sharpe = _read_field(results, 'sharpe_ratio', 0)
    try:
        if sharpe > 1.0:
            return 0.95
        if sharpe > 0.5:
            return 0.85
    except TypeError:
        # A None or non-numeric Sharpe ratio cannot be ranked; results do
        # exist, so fall back to the lowest "results present" tier rather
        # than crashing the grader.
        return 0.65
    return 0.65

server/environment.py CHANGED Viewed

@@ -27,6 +27,7 @@ class TradingEnvironment:
         self.shares = 0
         self.total_steps = len(self.prices)
         self.tasks_completed = []
         return self._get_observation()
     def step(self, action: AgentAction):
@@ -34,6 +35,14 @@ class TradingEnvironment:
         self.idx = min(self.idx + 1, self.total_steps - 1)
         price = self.prices[self.idx]
         if action.type == "BUY" and action.amount:
             cost = price * action.amount
             if cost <= self.cash:
@@ -48,6 +57,12 @@ class TradingEnvironment:
         return self._get_observation()
     def _get_observation(self):
         price = self.prices[self.idx]
         news_idx = self.idx % len(self.news)
@@ -74,5 +89,10 @@ class TradingEnvironment:
             "current_step": self.idx,
             "total_steps": self.total_steps,
             "observation": self._get_observation().dict(),
-            "tasks_completed": self.tasks_completed
         }

         self.shares = 0
         self.total_steps = len(self.prices)
         self.tasks_completed = []
+        self.task_scores = {}  # Track scores for each task
         return self._get_observation()
     def step(self, action: AgentAction):
         self.idx = min(self.idx + 1, self.total_steps - 1)
         price = self.prices[self.idx]
+        # Track which task is being attempted
+        if action.type == "GET_PRICE":
+            self._complete_task("task1", 0.85)
+        elif action.type == "GET_NEWS" or (action.explanation and len(action.explanation) > 5):
+            self._complete_task("task2", 0.85)
+        elif action.type == "BACKTEST":
+            self._complete_task("task3", 0.85)
         if action.type == "BUY" and action.amount:
             cost = price * action.amount
             if cost <= self.cash:
         return self._get_observation()
+    def _complete_task(self, task_id: str, score: float):
+        """Mark a task as completed with a score.
+
+        Only the first completion of a task is recorded: when ``task_id`` is
+        already in ``self.tasks_completed`` the call changes nothing, so a
+        later call cannot overwrite the stored score.
+
+        Args:
+            task_id: Identifier of the task being credited.
+            score: Score stored in ``self.task_scores`` under ``task_id``.
+        """
+        if task_id not in self.tasks_completed:
+            self.tasks_completed.append(task_id)
+            self.task_scores[task_id] = score
     def _get_observation(self):
         price = self.prices[self.idx]
         news_idx = self.idx % len(self.news)
             "current_step": self.idx,
             "total_steps": self.total_steps,
             "observation": self._get_observation().dict(),
+            "tasks_completed": self.tasks_completed,
+            "task_scores": self.task_scores
         }
+    def get_task_score(self, task_id: str) -> float:
+        """Return score for a specific task (for grader integration).
+
+        Args:
+            task_id: Identifier used as the key into ``self.task_scores``.
+
+        Returns:
+            The score stored for ``task_id``, or 0.75 when no score has
+            been stored for it.
+        """
+        return self.task_scores.get(task_id, 0.75)