From 413951bf98c79215015a54b39ff103c59db9485f Mon Sep 17 00:00:00 2001
From: Aaron Goldsmith <aargoldsmith@gmail.com>
Date: Sat, 21 Mar 2026 09:11:21 -0700
Subject: [PATCH 1/3] Add Docker sandbox for isolated agent execution

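Adds container lifecycle management (create/destroy/set sandbox),
sandbox-aware command routing, and a CLI --sandbox flag; sandbox mode
can also be enabled with MOBIUS_SANDBOX and the image overridden with
MOBIUS_SANDBOX_IMAGE. Includes review fixes: bind-mount working_dir
at /workspace, check the docker start return code, fail closed in
run_command when the requested sandbox is not an active container,
use sh -lc for compatibility, and expose a public
get_current_sandbox() getter. Note that in this commit a sandbox
creation failure is still logged and execution continues on the
host.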

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
---
 src/mobius/cli.py             |   3 +
 src/mobius/config.py          |  10 +++
 src/mobius/orchestrator.py    |  23 ++++++-
 src/mobius/providers/tools.py | 125 ++++++++++++++++++++++++++++++++--
 src/mobius/runner.py          |  15 ++--
 5 files changed, 165 insertions(+), 11 deletions(-)

diff --git a/src/mobius/cli.py b/src/mobius/cli.py
index 84e4ddc..6dc3108 100644
--- a/src/mobius/cli.py
+++ b/src/mobius/cli.py
@@ -103,6 +103,7 @@ def run(
     task: str = typer.Argument(..., help="The task for agents to compete on"),
     n: int = typer.Option(None, "--agents", "-n", help="Number of competing agents"),
     no_ui: bool = typer.Option(False, "--no-ui", help="Disable live terminal UI"),
+    sandbox: bool = typer.Option(False, "--sandbox", help="Run agents in Docker sandbox"),
     verbose: bool = typer.Option(False, "--verbose", "-v"),
 ):
     """Run a competition: select agents, execute in parallel, judge outputs."""
@@ -111,6 +112,8 @@ def run(
 
     if n:
         config.swarm_size = n
+    if sandbox:
+        config.sandbox_enabled = True
 
     agent_count = registry.count_agents()
     if agent_count == 0:
diff --git a/src/mobius/config.py b/src/mobius/config.py
index f90fbba..126fe60 100644
--- a/src/mobius/config.py
+++ b/src/mobius/config.py
@@ -24,6 +24,12 @@ class MobiusConfig(BaseModel):
     agent_max_turns: int = 10
     agent_budget_usd: float = 0.05
 
+    # Sandbox
+    sandbox_enabled: bool = False
+    sandbox_image: str = "python:3.12-slim"
+    sandbox_memory_limit: str = "512m"
+    sandbox_network: bool = False  # no network access by default
+
     # Judge
     judge_models: list[dict[str, str]] = [
         {"provider": "anthropic", "model": "claude-opus-4-6"},
@@ -89,5 +95,9 @@ def get_config() -> MobiusConfig:
         config.swarm_size = int(val)
     if val := os.environ.get("MOBIUS_BUDGET_USD"):
         config.global_budget_usd = float(val)
+    if os.environ.get("MOBIUS_SANDBOX", "").lower() in ("1", "true", "yes"):
+        config.sandbox_enabled = True
+    if val := os.environ.get("MOBIUS_SANDBOX_IMAGE"):
+        config.sandbox_image = val
 
     return config
diff --git a/src/mobius/orchestrator.py b/src/mobius/orchestrator.py
index bbff38f..207de21 100644
--- a/src/mobius/orchestrator.py
+++ b/src/mobius/orchestrator.py
@@ -10,6 +10,7 @@
 from mobius.judge import JudgePanel
 from mobius.memory import Memory
 from mobius.models import AgentRecord, JudgeVerdict, MatchRecord, MemoryEntry
+from mobius.providers.tools import create_sandbox, destroy_sandbox, set_sandbox
 from mobius.selector import Selector
 from mobius.swarm import Swarm, SwarmResult
 from mobius.tournament import Tournament
@@ -125,7 +126,24 @@ async def run_competition(
             [a.slug for a in agents],
         )
 
-        # 2. Run swarm
+        # 2. Set up sandbox if enabled
+        sandbox_name = None
+        if self.config.sandbox_enabled:
+            try:
+                sandbox_name = create_sandbox(
+                    image=self.config.sandbox_image,
+                    memory_limit=self.config.sandbox_memory_limit,
+                    network=self.config.sandbox_network,
+                    working_dir=working_dir,
+                )
+                set_sandbox(sandbox_name)
+                logger.info("Sandbox active: %s", sandbox_name)
+            except Exception as e:
+                logger.warning("Sandbox creation failed, running on host: %s", e)
+                sandbox_name = None
+                set_sandbox(None)
+
+        # 3. Run swarm
         ui = SwarmUI() if show_ui else None
         if ui:
             # Register agents for UI display
@@ -151,6 +169,9 @@ async def run_competition(
         finally:
             if ui:
                 ui.stop()
+            if sandbox_name:
+                set_sandbox(None)
+                destroy_sandbox(sandbox_name)
 
         # 3. Check if we have enough outputs to judge
         successful = swarm_result.successful_outputs
diff --git a/src/mobius/providers/tools.py b/src/mobius/providers/tools.py
index e853284..e1e51a6 100644
--- a/src/mobius/providers/tools.py
+++ b/src/mobius/providers/tools.py
@@ -2,6 +2,9 @@
 
 Each provider has its own format for declaring tools, but the underlying
 execution is identical: run a shell command, return the output.
+
+When sandbox mode is enabled, commands run inside a disposable Docker
+container instead of on the host.
 """
 
 from __future__ import annotations
@@ -9,18 +12,128 @@
 import logging
 import os
 import subprocess
+import uuid
 
 logger = logging.getLogger(__name__)
 
 
-def run_command(command: str, timeout: int = 30, working_dir: str | None = None) -> str:
-    """Execute a shell command and return output."""
+# ---------------------------------------------------------------------------
+# Sandbox container lifecycle
+# ---------------------------------------------------------------------------
+
+_active_containers: dict[str, str] = {}  # name -> container id
+_current_sandbox: str | None = None  # set by orchestrator for current competition
+
+
+def create_sandbox(
+    image: str = "python:3.12-slim",
+    memory_limit: str = "512m",
+    network: bool = False,
+    working_dir: str | None = None,
+) -> str:
+    """Create and start a warm sandbox container. Returns container name."""
+    name = f"mobius-sandbox-{uuid.uuid4().hex[:8]}"
+    cmd = [
+        "docker", "create",
+        "--name", name,
+        "--memory", memory_limit,
+        "--cpus", "1",
+        "--workdir", "/workspace",
+    ]
+    if working_dir:
+        cmd += ["-v", f"{working_dir}:/workspace"]
+    if not network:
+        cmd += ["--network", "none"]
+    cmd += [image, "sleep", "infinity"]
+
+    result = subprocess.run(cmd, capture_output=True, text=True, timeout=30)
+    if result.returncode != 0:
+        raise RuntimeError(f"Failed to create sandbox: {result.stderr.strip()}")
+
+    start_result = subprocess.run(
+        ["docker", "start", name],
+        capture_output=True, text=True, timeout=10,
+    )
+    if start_result.returncode != 0:
+        # Cleanup the created-but-not-started container
+        subprocess.run(
+            ["docker", "rm", "-f", name],
+            capture_output=True, text=True, timeout=10,
+        )
+        raise RuntimeError(f"Failed to start sandbox: {start_result.stderr.strip()}")
+
+    _active_containers[name] = result.stdout.strip()
+    logger.info("Sandbox created: %s (image=%s, network=%s)", name, image, network)
+    return name
+
+
+def destroy_sandbox(name: str) -> None:
+    """Stop and remove a sandbox container."""
     try:
-        result = subprocess.run(
-            command, shell=True, capture_output=True, text=True,
-            timeout=timeout, cwd=working_dir or os.getcwd(),
-            encoding="utf-8", errors="replace",
+        subprocess.run(
+            ["docker", "rm", "-f", name],
+            capture_output=True, text=True, timeout=15,
         )
+        _active_containers.pop(name, None)
+        logger.info("Sandbox destroyed: %s", name)
+    except Exception as e:
+        logger.warning("Failed to destroy sandbox %s: %s", name, e)
+
+
+def destroy_all_sandboxes() -> None:
+    """Clean up all active sandbox containers."""
+    for name in list(_active_containers):
+        destroy_sandbox(name)
+
+
+def set_sandbox(name: str | None) -> None:
+    """Set the active sandbox for all subsequent run_command calls."""
+    global _current_sandbox
+    _current_sandbox = name
+
+
+def get_current_sandbox() -> str | None:
+    """Return the name of the currently active sandbox, or None."""
+    return _current_sandbox
+
+
+# ---------------------------------------------------------------------------
+# Command execution
+# ---------------------------------------------------------------------------
+
+def run_command(
+    command: str,
+    timeout: int = 30,
+    working_dir: str | None = None,
+    sandbox: str | None = None,
+) -> str:
+    """Execute a shell command and return output.
+
+    Args:
+        command: The shell command to run.
+        timeout: Max seconds before killing the command.
+        working_dir: Working directory (host mode only).
+        sandbox: Container name to exec into. If None, uses current sandbox.
+    """
+    sandbox = sandbox or _current_sandbox
+    try:
+        if sandbox:
+            if sandbox not in _active_containers:
+                raise RuntimeError(
+                    f"Sandbox '{sandbox}' is not in active containers. "
+                    "Refusing to fall back to host execution."
+                )
+            result = subprocess.run(
+                ["docker", "exec", sandbox, "sh", "-lc", command],
+                capture_output=True, text=True, timeout=timeout,
+                encoding="utf-8", errors="replace",
+            )
+        else:
+            result = subprocess.run(
+                command, shell=True, capture_output=True, text=True,
+                timeout=timeout, cwd=working_dir or os.getcwd(),
+                encoding="utf-8", errors="replace",
+            )
         output = result.stdout
         if result.returncode != 0 and result.stderr:
             output += f"\n[stderr]: {result.stderr}"
diff --git a/src/mobius/runner.py b/src/mobius/runner.py
index 1749e3f..2ca46f9 100644
--- a/src/mobius/runner.py
+++ b/src/mobius/runner.py
@@ -12,6 +12,7 @@
 from mobius.providers.google import GoogleProvider
 from mobius.providers.openai import OpenAIProvider
 from mobius.providers.openrouter import OpenRouterProvider
+from mobius.providers.tools import get_current_sandbox
 
 logger = logging.getLogger(__name__)
 
@@ -66,10 +67,16 @@ def get_provider(provider_name: ProviderType) -> Provider:
 
 def _build_context_prefix(agent: AgentRecord, working_dir: str) -> str:
     """Build an environment context string so agents know what they can do."""
-    lines = [
-        f"Working directory: {os.path.basename(working_dir)}",
-        _PLATFORM_LINE,
-    ]
+    if get_current_sandbox():
+        lines = [
+            "Working directory: /workspace",
+            "Platform: Linux (sandboxed Docker container)",
+        ]
+    else:
+        lines = [
+            f"Working directory: {os.path.basename(working_dir)}",
+            _PLATFORM_LINE,
+        ]
 
     # Only advertise tools that are actually wired up in providers.
     tools = [t for t in (agent.tools or []) if t in _IMPLEMENTED_TOOLS]

From d519e586c2653ffe3ccd7c85543eeb208efef635 Mon Sep 17 00:00:00 2001
From: Aaron Goldsmith <aargoldsmith@gmail.com>
Date: Sat, 21 Mar 2026 09:31:20 -0700
Subject: [PATCH 2/3] Fix sandbox security: abort on creation failure, check
 destroy returncode

- orchestrator.py: Raise RuntimeError when sandbox creation fails and
  sandbox_enabled=True instead of silently falling back to host execution
- providers/tools.py: Check docker rm returncode before removing from
  _active_containers dict; only clean up tracking on success

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 src/mobius/orchestrator.py    |  7 ++++---
 src/mobius/providers/tools.py | 12 +++++++++---
 2 files changed, 13 insertions(+), 6 deletions(-)

diff --git a/src/mobius/orchestrator.py b/src/mobius/orchestrator.py
index 207de21..243cb71 100644
--- a/src/mobius/orchestrator.py
+++ b/src/mobius/orchestrator.py
@@ -139,9 +139,10 @@ async def run_competition(
                 set_sandbox(sandbox_name)
                 logger.info("Sandbox active: %s", sandbox_name)
             except Exception as e:
-                logger.warning("Sandbox creation failed, running on host: %s", e)
-                sandbox_name = None
-                set_sandbox(None)
+                raise RuntimeError(
+                    f"Sandbox creation failed and sandbox_enabled=True, "
+                    f"refusing to run on host: {e}"
+                ) from e
 
         # 3. Run swarm
         ui = SwarmUI() if show_ui else None
diff --git a/src/mobius/providers/tools.py b/src/mobius/providers/tools.py
index e1e51a6..1de7dbb 100644
--- a/src/mobius/providers/tools.py
+++ b/src/mobius/providers/tools.py
@@ -70,12 +70,18 @@ def create_sandbox(
 def destroy_sandbox(name: str) -> None:
     """Stop and remove a sandbox container."""
     try:
-        subprocess.run(
+        result = subprocess.run(
             ["docker", "rm", "-f", name],
             capture_output=True, text=True, timeout=15,
         )
-        _active_containers.pop(name, None)
-        logger.info("Sandbox destroyed: %s", name)
+        if result.returncode == 0:
+            _active_containers.pop(name, None)
+            logger.info("Sandbox destroyed: %s", name)
+        else:
+            logger.warning(
+                "Failed to destroy sandbox %s: docker rm returned %d: %s",
+                name, result.returncode, result.stderr.strip(),
+            )
     except Exception as e:
         logger.warning("Failed to destroy sandbox %s: %s", name, e)
 

From ae33bf37c8eba0201cce7353a7cc58b9f3e0994b Mon Sep 17 00:00:00 2001
From: Aaron Goldsmith <aargoldsmith@gmail.com>
Date: Sat, 21 Mar 2026 10:14:10 -0700
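Subject: [PATCH 3/3] Default working_dir to cwd when sandbox enabled

create_sandbox only adds the "-v <working_dir>:/workspace" bind mount
when working_dir is set, so a run with working_dir=None would start
the container without the host directory mounted at /workspace.
Fall back to os.getcwd() before creating the sandbox.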

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 src/mobius/orchestrator.py | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/src/mobius/orchestrator.py b/src/mobius/orchestrator.py
index 243cb71..91d4253 100644
--- a/src/mobius/orchestrator.py
+++ b/src/mobius/orchestrator.py
@@ -3,6 +3,7 @@
 from __future__ import annotations
 
 import logging
+import os
 
 from mobius.config import MobiusConfig
 from mobius.db import vec_to_blob
@@ -129,6 +130,8 @@ async def run_competition(
         # 2. Set up sandbox if enabled
         sandbox_name = None
         if self.config.sandbox_enabled:
+            if working_dir is None:
+                working_dir = os.getcwd()
             try:
                 sandbox_name = create_sandbox(
                     image=self.config.sandbox_image,