Spaces:

Omkar1806
/

code

Running

App Files Files Community

Omkar1806 committed 20 days ago

Commit

746be7a

verified ·

1 Parent(s): 45730bd

Update env.py

Browse files

Files changed (1) hide show

env.py +21 -33

env.py CHANGED Viewed

@@ -2,43 +2,42 @@ import numpy as np
 import gymnasium as gym
 from gymnasium import spaces
-# --- UI LABELS (app.py asks for these labels) ---
 URGENCY_LABELS = ["General", "Billing", "Security Breach"]
 ROUTING_LABELS = ["AI Auto-Reply", "Tech Support", "Legal"]
 RESOLUTION_LABELS = ["Archive", "Draft Reply", "Escalate to Human"]
-# --- Vocabulary & Encoding Configuration ---
 KEYWORD_VOCAB = [
-    "invoice", "payment", "overdue", "refund",          # billing
-    "hacked", "breach", "unauthorized", "password",     # security
-    "crash", "error", "bug", "slow",                    # tech
-    "lawsuit", "legal", "attorney", "sue",              # legal
-    "spam", "offer", "win", "free",                     # spam
-    "urgent", "critical", "angry", "threat",            # sentiment signals
 ]
 SENTIMENT_MAP = {"positive": 0, "neutral": 1, "negative": 2}
 CONTEXT_MAP = {"spam": 0, "billing": 1, "tech": 2, "security": 3, "legal": 4}
 OBS_DIM = len(KEYWORD_VOCAB) + len(SENTIMENT_MAP) + len(CONTEXT_MAP)
-# --- Environment Class ---
 class EmailTriageEnv(gym.Env):
     def __init__(self, task="all", batch=None, shuffle=True):
         super().__init__()
-        # Import the dataset (it will be loaded from app.py)
         try:
             from app import EMAIL_DATASET
             dataset_to_use = EMAIL_DATASET
         except ImportError:
-            dataset_to_use = [] # Fallback if the dataset is not found
         if batch is not None:
-            self.email_batch = batch
         elif task != "all":
-            self.email_batch = [e for e in dataset_to_use if e.get("difficulty") == task]
         else:
-            self.email_batch = dataset_to_use
         self.shuffle = shuffle
         self.action_space = spaces.MultiDiscrete([3, 3, 3])
@@ -49,48 +48,37 @@ class EmailTriageEnv(gym.Env):
         kw_flags = np.array([1.0 if kw in email.get("keywords", []) else 0.0 for kw in KEYWORD_VOCAB])
         sent_idx = SENTIMENT_MAP.get(email.get("sentiment", "neutral"), 1)
         sentiment_vec = np.zeros(len(SENTIMENT_MAP)); sentiment_vec[sent_idx] = 1.0
         ctx_idx = CONTEXT_MAP.get(email.get("context", "spam"), 0)
         context_vec = np.zeros(len(CONTEXT_MAP)); context_vec[ctx_idx] = 1.0
         return np.concatenate([kw_flags, sentiment_vec, context_vec]).astype(np.float32)
     def reset(self, seed=None, options=None):
         super().reset(seed=seed)
         self._step_idx = 0
-        if not self.email_batch:
-            return np.zeros(OBS_DIM, dtype=np.float32), {}
-        obs = self._encode(self.email_batch[0])
-        return obs, {"description": self.email_batch[0].get("description", "")}
     def step(self, action):
-        email = self.email_batch[self._step_idx]
         correct = email["correct_actions"]
-        # Reward logic (to improve the score)
         reward = 0.0
         if correct[0] == 2 and action[0] != 2:
-            reward = -2.0  # Security missed penalty
         elif tuple(action) == correct:
             reward = 1.0
         elif action[0] == correct[0]:
             reward = 0.2
         self._step_idx += 1
-        terminated = self._step_idx >= len(self.email_batch)
-        # Next observation
-        if not terminated:
-            next_email = self.email_batch[self._step_idx]
-            obs = self._encode(next_email)
-        else:
-            obs = self._encode(email)
         info = {
             "description": email.get("description", ""),
             "correct_actions": correct,
             "raw_reward": reward
         }
         return obs, float(reward), terminated, False, info

 import gymnasium as gym
 from gymnasium import spaces
+# --- UI LABELS ---
 URGENCY_LABELS = ["General", "Billing", "Security Breach"]
 ROUTING_LABELS = ["AI Auto-Reply", "Tech Support", "Legal"]
 RESOLUTION_LABELS = ["Archive", "Draft Reply", "Escalate to Human"]
+# --- Vocabulary & Config ---
 KEYWORD_VOCAB = [
+    "invoice", "payment", "overdue", "refund",
+    "hacked", "breach", "unauthorized", "password",
+    "crash", "error", "bug", "slow",
+    "lawsuit", "legal", "attorney", "sue",
+    "spam", "offer", "win", "free",
+    "urgent", "critical", "angry", "threat",
 ]
 SENTIMENT_MAP = {"positive": 0, "neutral": 1, "negative": 2}
 CONTEXT_MAP = {"spam": 0, "billing": 1, "tech": 2, "security": 3, "legal": 4}
 OBS_DIM = len(KEYWORD_VOCAB) + len(SENTIMENT_MAP) + len(CONTEXT_MAP)
 class EmailTriageEnv(gym.Env):
     def __init__(self, task="all", batch=None, shuffle=True):
         super().__init__()
         try:
             from app import EMAIL_DATASET
             dataset_to_use = EMAIL_DATASET
         except ImportError:
+            dataset_to_use = []
+        # Fix: app.py needs the batch stored as '_queue' for the interface to work
         if batch is not None:
+            self._queue = batch
         elif task != "all":
+            self._queue = [e for e in dataset_to_use if e.get("difficulty") == task]
         else:
+            self._queue = dataset_to_use
         self.shuffle = shuffle
         self.action_space = spaces.MultiDiscrete([3, 3, 3])
         kw_flags = np.array([1.0 if kw in email.get("keywords", []) else 0.0 for kw in KEYWORD_VOCAB])
         sent_idx = SENTIMENT_MAP.get(email.get("sentiment", "neutral"), 1)
         sentiment_vec = np.zeros(len(SENTIMENT_MAP)); sentiment_vec[sent_idx] = 1.0
         ctx_idx = CONTEXT_MAP.get(email.get("context", "spam"), 0)
         context_vec = np.zeros(len(CONTEXT_MAP)); context_vec[ctx_idx] = 1.0
         return np.concatenate([kw_flags, sentiment_vec, context_vec]).astype(np.float32)
     def reset(self, seed=None, options=None):
         super().reset(seed=seed)
         self._step_idx = 0
+        if not self._queue: return np.zeros(OBS_DIM, dtype=np.float32), {}
+        obs = self._encode(self._queue[0])
+        return obs, {"description": self._queue[0].get("description", "")}
     def step(self, action):
+        email = self._queue[self._step_idx]
         correct = email["correct_actions"]
         reward = 0.0
+        # Critical Security Check
         if correct[0] == 2 and action[0] != 2:
+            reward = -2.0
         elif tuple(action) == correct:
             reward = 1.0
         elif action[0] == correct[0]:
             reward = 0.2
         self._step_idx += 1
+        terminated = self._step_idx >= len(self._queue)
+        obs = self._encode(email)
         info = {
             "description": email.get("description", ""),
             "correct_actions": correct,
             "raw_reward": reward
         }
         return obs, float(reward), terminated, False, info