DEVessi committed on
Commit
37b054e
·
verified ·
1 Parent(s): e9c3076

Upload folder using huggingface_hub

Browse files
.gitignore ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Virtual environments
2
+ venv/
3
+ .venv/
4
+ env/
5
+ ENV/
6
+
7
+ # Python
8
+ __pycache__/
9
+ *.py[cod]
10
+ *$py.class
11
+ *.so
12
+ *.egg
13
+ *.egg-info/
14
+ .eggs/
15
+ build/
16
+ dist/
17
+
18
+ # Node
19
+ node_modules/
20
+ npm-debug.log
21
+ yarn-error.log
22
+
23
+ # IDEs and Editors
24
+ .vscode/
25
+ .idea/
26
+ *.swp
27
+ *.swo
28
+ .DS_Store
29
+
30
+ # Application Specific / Temp
31
+ *.log
32
+ validation_output.txt
33
+ _cli_path.txt
34
+ _path.txt
Dockerfile CHANGED
@@ -1,69 +1,69 @@
1
- # Hugging Face Spaces Dockerfile for Self-Healing DevOps Sandbox
2
- FROM ghcr.io/meta-pytorch/openenv-base:latest AS builder
3
-
4
- USER root
5
-
6
- # Install Node.js 20 & utilities needed by the sandbox
7
- RUN apt-get update && \
8
- apt-get install -y --no-install-recommends git curl bash && \
9
- curl -fsSL https://deb.nodesource.com/setup_20.x | bash - && \
10
- apt-get install -y nodejs && \
11
- rm -rf /var/lib/apt/lists/*
12
-
13
- WORKDIR /server_app
14
-
15
- # Copy environment code
16
- COPY . /server_app/env
17
- WORKDIR /server_app/env
18
-
19
- # Ensure uv is available
20
- RUN if ! command -v uv >/dev/null 2>&1; then \
21
- curl -LsSf https://astral.sh/uv/install.sh | sh && \
22
- mv /root/.local/bin/uv /usr/local/bin/uv && \
23
- mv /root/.local/bin/uvx /usr/local/bin/uvx; \
24
- fi
25
-
26
- # Install dependencies using uv sync
27
- RUN --mount=type=cache,target=/root/.cache/uv \
28
- if [ -f uv.lock ]; then \
29
- uv sync --no-install-project --no-editable; \
30
- else \
31
- uv sync --no-editable; \
32
- fi
33
-
34
- # Final runtime stage
35
- FROM ghcr.io/meta-pytorch/openenv-base:latest
36
-
37
- USER root
38
-
39
- # Re-install Node.js 20 in the runtime image
40
- RUN apt-get update && \
41
- apt-get install -y --no-install-recommends git curl bash psmisc && \
42
- curl -fsSL https://deb.nodesource.com/setup_20.x | bash - && \
43
- apt-get install -y nodejs && \
44
- rm -rf /var/lib/apt/lists/*
45
-
46
- WORKDIR /server_app
47
-
48
- # Copy the virtual environment from builder
49
- COPY --from=builder /server_app/env/.venv /server_app/.venv
50
-
51
- # Copy the environment code
52
- COPY --from=builder /server_app/env /server_app/env
53
-
54
- # Ensure the backup folder for reset() is available and perfectly clean
55
- # The environment script will do `cp -r /app_backup/* /app/` during every reset
56
- RUN mkdir -p /app_backup && \
57
- cp -r /server_app/env/simulated_app/* /app_backup/ && \
58
- mkdir -p /app && \
59
- chmod -R 777 /app /app_backup
60
-
61
- # Export Paths
62
- ENV PATH="/server_app/.venv/bin:$PATH"
63
- ENV PYTHONPATH="/server_app/env:$PYTHONPATH"
64
-
65
- # Run the FastAPI server on port 7860 for HuggingFace Spaces
66
- ENV ENABLE_WEB_INTERFACE=true
67
- EXPOSE 7860
68
-
69
- CMD ["sh", "-c", "cd /server_app/env && uvicorn server.app:app --host 0.0.0.0 --port 7860"]
 
1
# Hugging Face Spaces Dockerfile for Self-Healing DevOps Sandbox
FROM ghcr.io/meta-pytorch/openenv-base:latest AS builder

USER root

# Install Node.js 20 & utilities needed by the sandbox
RUN apt-get update && \
    apt-get install -y --no-install-recommends git curl bash && \
    curl -fsSL https://deb.nodesource.com/setup_20.x | bash - && \
    apt-get install -y nodejs && \
    rm -rf /var/lib/apt/lists/*

WORKDIR /server_app

# Copy environment code
COPY . /server_app/env
WORKDIR /server_app/env

# Ensure uv is available
RUN if ! command -v uv >/dev/null 2>&1; then \
        curl -LsSf https://astral.sh/uv/install.sh | sh && \
        mv /root/.local/bin/uv /usr/local/bin/uv && \
        mv /root/.local/bin/uvx /usr/local/bin/uvx; \
    fi

# Install dependencies using uv sync
RUN --mount=type=cache,target=/root/.cache/uv \
    if [ -f uv.lock ]; then \
        uv sync --no-install-project --no-editable; \
    else \
        uv sync --no-editable; \
    fi

# Final runtime stage
FROM ghcr.io/meta-pytorch/openenv-base:latest

USER root

# Re-install Node.js 20 in the runtime image
RUN apt-get update && \
    apt-get install -y --no-install-recommends git curl bash psmisc && \
    curl -fsSL https://deb.nodesource.com/setup_20.x | bash - && \
    apt-get install -y nodejs && \
    rm -rf /var/lib/apt/lists/*

WORKDIR /server_app

# Copy the virtual environment from builder
COPY --from=builder /server_app/env/.venv /server_app/.venv

# Copy the environment code
COPY --from=builder /server_app/env /server_app/env

# Ensure the backup folder for reset() is available and perfectly clean
# The environment script will do `cp -r /app_backup/* /app/` during every reset
RUN mkdir -p /app_backup && \
    cp -r /server_app/env/simulated_app/* /app_backup/ && \
    mkdir -p /app && \
    chmod -R 777 /app /app_backup

# Export Paths
ENV PATH="/server_app/.venv/bin:$PATH"
ENV PYTHONPATH="/server_app/env:$PYTHONPATH"

# Run the FastAPI server on port 7860 for HuggingFace Spaces
ENV ENABLE_WEB_INTERFACE=true
EXPOSE 7860

# Use WORKDIR + exec-form CMD instead of `sh -c "cd ... && uvicorn ..."`:
# with the shell form, `sh` is PID 1 and SIGTERM never reaches uvicorn,
# so the container cannot shut down cleanly. Exec form makes uvicorn PID 1.
WORKDIR /server_app/env
CMD ["uvicorn", "server.app:app", "--host", "0.0.0.0", "--port", "7860"]
inference.py CHANGED
@@ -10,14 +10,6 @@ Baseline inference script for the Self-Healing DevOps Sandbox.
10
 
11
  Uses an LLM (via the OpenAI-compatible API) to diagnose and fix a broken
12
  Node.js backend running inside a Docker container.
13
-
14
- Usage:
15
- export OPENAI_API_KEY="sk-..."
16
- python baseline.py
17
-
18
- # Or with a custom endpoint (e.g., local vLLM):
19
- export OPENAI_BASE_URL="http://localhost:8080/v1"
20
- python baseline.py
21
  """
22
 
23
  import json
@@ -30,14 +22,20 @@ except ImportError:
30
  print("ERROR: 'openai' package is required. Install with: pip install openai")
31
  sys.exit(1)
32
 
33
- from devops_sandbox import BashAction, DevopsSandboxEnv
 
34
 
35
  # ---------------------------------------------------------------------------
36
  # Configuration
37
  # ---------------------------------------------------------------------------
 
 
 
 
38
  ENV_URL = os.getenv("DEVOPS_SANDBOX_URL", "http://localhost:8000")
39
- MODEL = os.getenv("OPENAI_MODEL", "gpt-4o-mini")
40
- MAX_TURNS = int(os.getenv("MAX_TURNS", "30"))
 
41
 
42
  SYSTEM_PROMPT = """\
43
  You are an expert DevOps engineer and Node.js developer.
@@ -59,10 +57,8 @@ EXPECTED FINAL STATE:
59
  - GET /api/data → 200 with JSON containing "records" array
60
  """
61
 
62
-
63
  def extract_command(llm_response: str) -> str:
64
  """Extract a bash command from the LLM's response (JSON or raw text)."""
65
- # Try JSON parsing first
66
  try:
67
  data = json.loads(llm_response.strip())
68
  if isinstance(data, dict) and "command" in data:
@@ -70,10 +66,9 @@ def extract_command(llm_response: str) -> str:
70
  except (json.JSONDecodeError, TypeError):
71
  pass
72
 
73
- # Try extracting from markdown code block
74
  if "```" in llm_response:
75
  lines = llm_response.split("```")
76
- for block in lines[1::2]: # odd indices are code blocks
77
  code = block.strip()
78
  if code.startswith("json"):
79
  code = code[4:].strip()
@@ -91,36 +86,29 @@ def extract_command(llm_response: str) -> str:
91
  if first_line:
92
  return first_line
93
 
94
- # Fallback: treat entire response as a command
95
  cmd = llm_response.strip().strip("`").strip()
96
  if cmd.startswith("{"):
97
- # One more try
98
  try:
99
  return json.loads(cmd)["command"]
100
  except Exception:
101
  pass
102
  return cmd
103
 
104
-
105
  def main():
106
- print("=" * 60)
107
- print(" Self-Healing DevOps Sandbox Baseline Agent")
108
- print("=" * 60)
109
 
110
- client = OpenAI()
111
 
 
112
  messages = [{"role": "system", "content": SYSTEM_PROMPT}]
113
 
114
  with DevopsSandboxEnv(base_url=ENV_URL).sync() as env:
115
- # Reset the environment
116
- print("\n[*] Resetting environment...")
117
  result = env.reset()
118
  obs = result.observation
 
 
119
 
120
- print(f"\n[INIT] Task prompt:\n{obs.stdout[:500]}...")
121
- print(f"[INIT] Score: {obs.grader_score} | Feedback: {obs.grader_feedback}")
122
-
123
- # Add initial observation to messages
124
  messages.append({
125
  "role": "user",
126
  "content": (
@@ -132,72 +120,66 @@ def main():
132
  ),
133
  })
134
 
135
- for turn in range(1, MAX_TURNS + 1):
136
- print(f"\n{'─' * 40}")
137
- print(f"Turn {turn}/{MAX_TURNS}")
138
- print(f"{'─' * 40}")
139
 
140
- # Get LLM response
141
  try:
142
  response = client.chat.completions.create(
143
- model=MODEL,
144
  messages=messages,
145
  temperature=0.2,
146
  max_tokens=256,
147
  )
148
  llm_text = response.choices[0].message.content or ""
149
  except Exception as e:
150
- print(f"[ERROR] LLM call failed: {e}")
 
151
  break
152
 
153
- # Extract command
154
  command = extract_command(llm_text)
155
  if not command:
156
- print("[WARN] Could not extract command from LLM response")
157
  command = "ls -la /app"
158
 
159
- print(f"[CMD] {command}")
 
 
 
 
 
 
160
 
161
- # Execute in environment
162
- result = env.step(BashAction(command=command))
163
- obs = result.observation
 
 
164
 
165
- stdout_preview = obs.stdout[:300] if obs.stdout else "(empty)"
166
- stderr_preview = obs.stderr[:200] if obs.stderr else "(none)"
167
- print(f"[OUT] {stdout_preview}")
168
- if obs.stderr:
169
- print(f"[ERR] {stderr_preview}")
170
- print(f"[SCORE] {obs.grader_score:.2f} | {obs.grader_feedback}")
171
 
172
- # Add to conversation
173
  messages.append({"role": "assistant", "content": llm_text})
174
  messages.append({
175
  "role": "user",
176
  "content": (
177
  f"Command output:\n"
178
- f"stdout:\n```\n{obs.stdout}\n```\n"
179
- f"stderr:\n```\n{obs.stderr}\n```\n"
180
- f"Current score: {obs.grader_score}/1.0\n"
181
- f"Grader feedback: {obs.grader_feedback}\n\n"
182
  f"What command should I run next?"
183
  ),
184
  })
185
 
186
- # Check if done
187
- if result.done:
188
- print(f"\n{'=' * 60}")
189
- if obs.grader_score >= 1.0:
190
- print(" ✅ ALL BUGS FIXED — PERFECT SCORE!")
191
- else:
192
- print(f" Episode ended. Final score: {obs.grader_score:.2f}/1.0")
193
- print(f"{'=' * 60}")
194
  break
195
- else:
196
- print(f"\n[!] Max turns ({MAX_TURNS}) reached.")
197
- print(f" Final score: {obs.grader_score:.2f}/1.0")
198
-
199
- print("\n[*] Done.")
200
 
 
 
 
201
 
202
  if __name__ == "__main__":
203
  main()
 
10
 
11
  Uses an LLM (via the OpenAI-compatible API) to diagnose and fix a broken
12
  Node.js backend running inside a Docker container.
 
 
 
 
 
 
 
 
13
  """
14
 
15
  import json
 
22
  print("ERROR: 'openai' package is required. Install with: pip install openai")
23
  sys.exit(1)
24
 
25
+ from client import DevopsSandboxEnv
26
+ from models import BashAction
27
 
28
  # ---------------------------------------------------------------------------
29
  # Configuration
30
  # ---------------------------------------------------------------------------
31
+ API_BASE_URL = os.getenv("API_BASE_URL") or "https://router.huggingface.co/v1"
32
+ MODEL_NAME = os.getenv("MODEL_NAME") or "gpt-4o-mini"
33
+ HF_TOKEN = os.getenv("HF_TOKEN") or os.getenv("API_KEY")
34
+
35
  ENV_URL = os.getenv("DEVOPS_SANDBOX_URL", "http://localhost:8000")
36
+ TASK_NAME = os.getenv("MY_ENV_V4_TASK", "devops_sandbox")
37
+ BENCHMARK = os.getenv("MY_ENV_V4_BENCHMARK", "devops_sandbox")
38
+ MAX_TURNS = int(os.getenv("MAX_TURNS", "8"))
39
 
40
  SYSTEM_PROMPT = """\
41
  You are an expert DevOps engineer and Node.js developer.
 
57
  - GET /api/data → 200 with JSON containing "records" array
58
  """
59
 
 
60
  def extract_command(llm_response: str) -> str:
61
  """Extract a bash command from the LLM's response (JSON or raw text)."""
 
62
  try:
63
  data = json.loads(llm_response.strip())
64
  if isinstance(data, dict) and "command" in data:
 
66
  except (json.JSONDecodeError, TypeError):
67
  pass
68
 
 
69
  if "```" in llm_response:
70
  lines = llm_response.split("```")
71
+ for block in lines[1::2]:
72
  code = block.strip()
73
  if code.startswith("json"):
74
  code = code[4:].strip()
 
86
  if first_line:
87
  return first_line
88
 
 
89
  cmd = llm_response.strip().strip("`").strip()
90
  if cmd.startswith("{"):
 
91
  try:
92
  return json.loads(cmd)["command"]
93
  except Exception:
94
  pass
95
  return cmd
96
 
 
97
  def main():
98
+ if not HF_TOKEN:
99
+ pass # we can let it fail or use empty key depending on endpoint
 
100
 
101
+ client = OpenAI(api_key=HF_TOKEN or "dummy_key", base_url=API_BASE_URL)
102
 
103
+ # Note: openenv evaluation specifically needs exactly 3 things: [START], [STEP] logs, [END]
104
  messages = [{"role": "system", "content": SYSTEM_PROMPT}]
105
 
106
  with DevopsSandboxEnv(base_url=ENV_URL).sync() as env:
 
 
107
  result = env.reset()
108
  obs = result.observation
109
+
110
+ print(f"[START] task={TASK_NAME} env={BENCHMARK} model={MODEL_NAME}", flush=True)
111
 
 
 
 
 
112
  messages.append({
113
  "role": "user",
114
  "content": (
 
120
  ),
121
  })
122
 
123
+ rewards = []
124
+ is_done = False
125
+ steps_taken = 0
126
+ final_score = 0.0
127
 
128
+ for turn in range(1, MAX_TURNS + 1):
129
  try:
130
  response = client.chat.completions.create(
131
+ model=MODEL_NAME,
132
  messages=messages,
133
  temperature=0.2,
134
  max_tokens=256,
135
  )
136
  llm_text = response.choices[0].message.content or ""
137
  except Exception as e:
138
+ err_msg = str(e).replace('"', "'")
139
+ # Need to emit an empty step on failure? Usually not, just end.
140
  break
141
 
 
142
  command = extract_command(llm_text)
143
  if not command:
 
144
  command = "ls -la /app"
145
 
146
+ error_msg = "null"
147
+ try:
148
+ result = env.step(BashAction(command=command))
149
+ obs = result.observation
150
+ except Exception as e:
151
+ obs = env.state # Mock failed obs
152
+ error_msg = str(e).replace('\n', ' ')
153
 
154
+ steps_taken += 1
155
+ reward_val = obs.reward if hasattr(obs, 'reward') else getattr(obs, 'grader_score', 0.0)
156
+ rewards.append(f"{reward_val:.2f}")
157
+ is_done = result.done if hasattr(result, 'done') else getattr(obs, 'done', False)
158
+ done_str = "true" if is_done else "false"
159
 
160
+ action_str = command.replace('\n', ' ; ')
161
+ print(f"[STEP] step={steps_taken} action={action_str} reward={reward_val:.2f} done={done_str} error={error_msg}", flush=True)
 
 
 
 
162
 
 
163
  messages.append({"role": "assistant", "content": llm_text})
164
  messages.append({
165
  "role": "user",
166
  "content": (
167
  f"Command output:\n"
168
+ f"stdout:\n```\n{getattr(obs, 'stdout', '')}\n```\n"
169
+ f"stderr:\n```\n{getattr(obs, 'stderr', '')}\n```\n"
170
+ f"Current score: {getattr(obs, 'grader_score', 0.0)}/1.0\n"
171
+ f"Grader feedback: {getattr(obs, 'grader_feedback', '')}\n\n"
172
  f"What command should I run next?"
173
  ),
174
  })
175
 
176
+ final_score = getattr(obs, 'grader_score', 0.0)
177
+ if getattr(obs, 'grader_score', 0.0) >= 1.0 or getattr(obs, 'done', False) or result.done:
 
 
 
 
 
 
178
  break
 
 
 
 
 
179
 
180
+ success_str = "true" if final_score >= 1.0 else "false"
181
+ rewards_str = ",".join(rewards) if rewards else "0.00"
182
+ print(f"[END] success={success_str} steps={steps_taken} score={final_score:.2f} rewards={rewards_str}", flush=True)
183
 
184
  if __name__ == "__main__":
185
  main()
move.py ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
"""One-off helper: move the contents of a nested folder up into its parent.

The original script ran destructive filesystem operations at import time
with hard-coded paths; the logic is now in a reusable, testable function
and only runs when the file is executed directly.
"""
import os
import shutil


def move_contents(src: str, dst: str) -> None:
    """Move every entry from *src* into *dst*, replacing name collisions.

    Args:
        src: Directory whose entries are moved out.
        dst: Destination directory (must already exist).

    Any file or directory in *dst* sharing a name with an entry of *src*
    is removed first, so ``shutil.move`` cannot fail on an existing target
    or nest a directory inside an existing one of the same name.
    """
    for item in os.listdir(src):
        s = os.path.join(src, item)
        d = os.path.join(dst, item)
        if os.path.exists(d):
            # Clear the destination entry so the move replaces it cleanly.
            if os.path.isdir(d):
                shutil.rmtree(d, ignore_errors=True)
            else:
                os.remove(d)
        shutil.move(s, d)


if __name__ == "__main__":
    # Hard-coded Windows paths from the original one-off script.
    src = r"e:\programs2\openenv(RL)\devops_sandbox"
    dst = r"e:\programs2\openenv(RL)"
    move_contents(src, dst)
    print("Moved successfully")
server/# Self-Healing DevOps Sandbox - a Huggin.txt ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ # Self-Healing DevOps Sandbox - a Hugging Face Space by DEVessi
2
+
3
+
4
+ # [Spaces](https://huggingface.co/spaces) / [DEVessi](https://huggingface.co/DEVessi) / [devops_sandbox](https://huggingface.co/spaces/DEVessi/devops_sandbox) — like 0 · Building
5
+ [Spaces](https://huggingface.co/spaces)
6
+ [DEVessi](https://huggingface.co/DEVessi)
7
+ [devops_sandbox](https://huggingface.co/spaces/DEVessi/devops_sandbox)
8
+ [App](https://huggingface.co/spaces/DEVessi/devops_sandbox)
9
+ [Files Files](https://huggingface.co/spaces/DEVessi/devops_sandbox/tree/main)
10
+ [Community](https://huggingface.co/spaces/DEVessi/devops_sandbox/discussions)
server/devops_sandbox_environment.py CHANGED
@@ -209,11 +209,19 @@ class DevOpsSandbox(Environment):
209
  def _reset_filesystem(self) -> None:
210
  """Replace the current working /app with the pristine /app_backup."""
211
  # Ensure we don't accidentally wipe out the whole host on windows if paths are wrong
212
- if os.path.exists(self._app_dir):
213
- shutil.rmtree(self._app_dir, ignore_errors=True)
214
-
215
  os.makedirs(self._app_dir, exist_ok=True)
216
 
 
 
 
 
 
 
 
 
 
 
 
217
  # Copy from backup to app dir
218
  if os.path.exists(self._app_backup_dir):
219
  for item in os.listdir(self._app_backup_dir):
 
209
  def _reset_filesystem(self) -> None:
210
  """Replace the current working /app with the pristine /app_backup."""
211
  # Ensure we don't accidentally wipe out the whole host on windows if paths are wrong
 
 
 
212
  os.makedirs(self._app_dir, exist_ok=True)
213
 
214
+ # Clean contents of /app instead of deleting /app itself
215
+ for item in os.listdir(self._app_dir):
216
+ item_path = os.path.join(self._app_dir, item)
217
+ if os.path.isdir(item_path):
218
+ shutil.rmtree(item_path, ignore_errors=True)
219
+ else:
220
+ try:
221
+ os.remove(item_path)
222
+ except OSError:
223
+ pass
224
+
225
  # Copy from backup to app dir
226
  if os.path.exists(self._app_backup_dir):
227
  for item in os.listdir(self._app_backup_dir):