Spaces:

100XZX001
/

CodeReview-Professional-Workflow

Sleeping

App Files Files Community

100XZX001 committed 19 days ago

Commit

86c792b

verified ·

1 Parent(s): d089573

Create app.py

Browse files

Files changed (1) hide show

app.py +104 -0

app.py ADDED Viewed

	@@ -0,0 +1,104 @@

+# server/app.py – OpenEnv HTTP server
+# NOTE(review): the commit view lists this file as plain `app.py`; the
+# `server/` prefix above may be stale — confirm against the repo layout.
+import sys
+import os
+# Put the parent of this file's directory at the front of sys.path. This must
+# run before the `environment` / `models` imports below; presumably it is what
+# makes those project modules importable — confirm against the repo layout.
+sys.path.insert(0, os.path.dirname(os.path.dirname(__file__)))
+from fastapi import FastAPI, HTTPException
+from environment import CodeReviewEnv
+from models import AnyAction, Observation, Reward, State, action_adapter
+# Application object that every route decorator in this module registers on.
+app = FastAPI(title="Code Review Environment", version="1.0.0")
+# One module-level environment instance, shared by all request handlers below.
+env = CodeReviewEnv()
+# ----------------------------------------------------------------------
+# Health & metadata endpoints
+# ----------------------------------------------------------------------
+@app.get("/")
+def root():
+    print("[ROOT] Health check hit")
+    return {"status": "crazy good"}
+@app.get("/health")
+def health():
+    print("[HEALTH] Service is healthy")
+    return {"status": "healthy"}
+@app.get("/metadata")
+def metadata():
+    print("[METADATA] Requested")
+    return {
+        "name": "Code Review Professional Workflow",
+        "description": (
+            "Multi‑turn code review environment for professional‑level bug fixing. "
+            "The agent must inspect, test, lint, query documentation, and negotiate with "
+            "a simulated (persona‑driven) author to get a fix accepted. "
+            "Includes 25 bugs across 5 difficulty levels, AST‑based injection, "
+            "a reward‑shaping system (full/core profiles), and curriculum learning. "
+            "Designed for RL training (PPO, DPO, or any policy‑gradient method)."
+        )
+    }
+@app.get("/schema")
+def schema():
+    print("[SCHEMA] Requested")
+    return {
+        "action": AnyAction.model_json_schema(),
+        "observation": Observation.model_json_schema(),
+        "state": State.model_json_schema()
+    }
+@app.post("/mcp")
+def mcp():
+    print("[MCP] Ping received")
+    return {"jsonrpc": "2.0", "result": None}
+# ----------------------------------------------------------------------
+# Environment endpoints
+# ----------------------------------------------------------------------
+@app.post("/reset")
+def reset(task: str = "easy"):
+    try:
+        print(f"[RESET] Starting new episode | task={task}")
+        env.set_task(task)
+        obs = env.reset()
+        print(f"[RESET DONE] step={env._step_count}")
+        return obs.__dict__
+    except Exception as e:
+        print(f"[RESET ERROR] {e}")
+        raise HTTPException(status_code=400, detail=str(e))
+@app.post("/step")
+def step(action: dict):
+    try:
+        print(f"[STEP INPUT] {action}")
+        parsed_action = action_adapter.validate_python(action)
+        obs, reward, done, info = env.step(parsed_action)
+        print(f"[STEP OUTPUT] reward={reward.value:.4f} | done={done}")
+        return {
+            "observation": obs.__dict__,
+            "reward": reward.value,
+            "done": done,
+            "info": info
+        }
+    except Exception as e:
+        print(f"[STEP ERROR] {e}")
+        raise HTTPException(status_code=400, detail=str(e))
+@app.get("/state")
+def state():
+    print("[STATE] Requested")
+    return env._get_observation().__dict__
+# ----------------------------------------------------------------------
+# Main entry point (for local testing)
+# ----------------------------------------------------------------------
+if __name__ == "__main__":
+    import uvicorn
+    print("[SERVER START] Running on http://0.0.0.0:7860")
+    uvicorn.run(app, host="0.0.0.0", port=7860)