diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml index d86f522..3f89e9a 100644 --- a/.github/workflows/ci.yml +++ b/.github/workflows/ci.yml @@ -49,3 +49,23 @@ jobs: verbose: true env: CODECOV_TOKEN: ${{ secrets.CODECOV_TOKEN }} + + test-deno-sandbox: + runs-on: ubuntu-latest + steps: + - uses: actions/checkout@v6 + - uses: astral-sh/setup-uv@v7 + - uses: denoland/setup-deno@v2 + - name: Cache Deno modules + uses: actions/cache@v5 + with: + path: ~/.cache/deno + key: deno-${{ runner.os }}-${{ hashFiles('src/py_code_mode/execution/deno_sandbox/runner/**') }} + restore-keys: | + deno-${{ runner.os }}- + - run: uv sync --all-extras + - name: Run Deno sandbox integration tests + env: + PY_CODE_MODE_TEST_DENO: "1" + DENO_DIR: ~/.cache/deno + run: uv run pytest -n 0 tests/test_deno_sandbox_imports.py tests/test_deno_sandbox_executor.py -v diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml index c83d99a..4fa6715 100644 --- a/.pre-commit-config.yaml +++ b/.pre-commit-config.yaml @@ -1,8 +1,8 @@ repos: - repo: https://github.com/astral-sh/ruff-pre-commit - rev: v0.8.0 + # Keep in sync with the ruff version pinned in uv.lock / used in CI. + rev: v0.14.9 hooks: - id: ruff args: [--fix] - id: ruff-format - diff --git a/AGENTS.md b/AGENTS.md index 2200cfd..0e999b0 100644 --- a/AGENTS.md +++ b/AGENTS.md @@ -34,6 +34,7 @@ src/py_code_mode/ subprocess/ # Jupyter kernel-based subprocess executor container/ # Docker container executor in_process/ # Same-process executor + deno_sandbox/ # Deno + Pyodide (WASM) sandbox executor (experimental) workflows/ # Skill storage, library, and vector stores tools/ # Tool adapters: CLI, MCP, HTTP adapters/ # CLI, MCP, HTTP adapter implementations @@ -76,6 +77,7 @@ When agents write code, four namespaces are available: | SubprocessExecutor | Recommended default. Process isolation via Jupyter kernel. | | ContainerExecutor | Docker isolation for untrusted code. | | InProcessExecutor | Maximum speed for trusted code. | +| DenoSandboxExecutor | Sandboxed Python via Deno + Pyodide (WASM). Tools execute host-side. | --- @@ -98,6 +100,21 @@ uv run pytest -k "test_workflow" # Run without parallelism (for debugging) uv run pytest -n 0 + +# Run Deno sandbox integration tests (requires Deno installed) +PY_CODE_MODE_TEST_DENO=1 uv run pytest -n 0 tests/test_deno_sandbox_executor.py -v + +# Filter subsets (markers are defined in pyproject.toml) +uv run pytest -m "not docker" + +# Common subsets +uv run pytest -m "not slow" +uv run pytest -m docker +uv run pytest -m subprocess +uv run pytest -m "not docker and not subprocess" + +# CI uses all extras; for local repro of CI failures you may want: +uv sync --all-extras ``` ### Linting and Type Checking @@ -192,6 +209,7 @@ Tools are defined in YAML files. 
Key patterns: - Container tests are in `tests/container/` - require Docker - Use `@pytest.mark.xdist_group("group_name")` for tests that need isolation - Redis tests use testcontainers - spin up automatically +- Markers like `docker`, `subprocess`, `venv`, and `deno` are used to filter test subsets --- diff --git a/docs/ARCHITECTURE.md b/docs/ARCHITECTURE.md index 2a5ecaf..3ca41b5 100644 --- a/docs/ARCHITECTURE.md +++ b/docs/ARCHITECTURE.md @@ -791,7 +791,7 @@ async with Session(storage=storage, executor=executor) as session: ### Tool Execution ``` -Agent writes: "tools.curl.get(url='...')" +Agent writes: "tools.curl.get(url='...')" (use `await` only in DenoSandboxExecutor) | v +------------------------+ @@ -808,6 +808,12 @@ Agent writes: "tools.curl.get(url='...')" +--------------+ ``` +Note on sandboxing: +- `DenoSandboxExecutor` sandboxes Python execution in Pyodide, but **tools execute host-side** (the sandbox calls back to the host over RPC to run tools). If you need strict sandbox boundaries, avoid `tools.*` and stick to pure Python plus `deps.*` in the sandbox. + +Note on tool middleware: +- Tool calls can be wrapped by a host-side middleware chain (audit logging, approvals, allow/deny, retries, etc.). Enforcement guarantees are strongest for `DenoSandboxExecutor`, because sandboxed Python can only access tools via host RPC. + ### ToolProxy Methods ``` @@ -819,7 +825,7 @@ Agent writes: "tools.curl.get(url='...')" | | | .call_async(**kwargs) |--> Always returns awaitable | .call_sync(**kwargs) |--> Always blocks, returns result -| .__call__(**kwargs) |--> Context-aware (sync/async detection) +| .__call__(**kwargs) |--> Synchronous invocation +------------------------+ | v @@ -828,14 +834,14 @@ Agent writes: "tools.curl.get(url='...')" | | | .call_async(**kwargs) |--> Always returns awaitable | .call_sync(**kwargs) |--> Always blocks, returns result -| .__call__(**kwargs) |--> Context-aware (sync/async detection) +| .__call__(**kwargs) |--> Synchronous invocation +------------------------+ ``` ### Skill Execution ``` -Agent writes: "workflows.analyze_repo(repo='...')" +Agent writes: "workflows.analyze_repo(repo='...')" (use `await` only in DenoSandboxExecutor) | v +------------------------+ @@ -880,7 +886,7 @@ Skill has access to: ### Artifact Storage ``` -Agent writes: "artifacts.save('data.json', b'...', 'description')" +Agent writes: "artifacts.save('data.json', b'...', 'description')" (use `await` only in DenoSandboxExecutor) | v +------------------------+ diff --git a/docs/executors.md b/docs/executors.md index f491439..e8ff816 100644 --- a/docs/executors.md +++ b/docs/executors.md @@ -1,6 +1,60 @@ # Executors -Executors determine where and how agent code runs. Three backends are available: Subprocess, Container, and InProcess. +Executors determine where and how agent code runs. Four backends are available: Subprocess, Container, InProcess, and DenoSandbox (experimental). + +## DenoSandboxExecutor (Experimental, Sandboxed) + +`DenoSandboxExecutor` runs Python in **Pyodide (WASM)** inside a **Deno** subprocess. It relies on the Deno permission model for sandboxing. + +Notes: +- Backend key: `"deno-sandbox"`. +- Example: `examples/deno-sandbox/`. + +Key differences vs the other executors: +- **Async-first sandbox API**: use `await tools.*`, `await workflows.*`, `await artifacts.*`, `await deps.*`. +- **Best-effort deps**: dependency installs run via Pyodide `micropip` and many packages (especially those requiring native extensions) will not work. 
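+
+  A rough illustration of "best-effort" (package names are examples only; success
+  depends on whether a Pyodide/micropip-compatible wheel exists):
+
+  ```python
+  await deps.add("beautifulsoup4")  # pure-Python wheel: usually installable via micropip
+  await deps.add("psycopg2")        # needs native extensions: expected to fail in Pyodide
+  ```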
+- **Tool middleware support (host-side)**: you can attach tool call middleware via `DenoSandboxConfig.tool_middlewares` (useful for audit logging, approvals, allow/deny, etc.). + +```python +from pathlib import Path +from py_code_mode import Session, FileStorage +from py_code_mode.execution import DenoSandboxConfig, DenoSandboxExecutor + +storage = FileStorage(base_path=Path("./data")) + +config = DenoSandboxConfig( + tools_path=Path("./tools"), + deno_dir=Path("./.deno-cache"), # Deno cache directory (used with --cached-only) + network_profile="deps-only", # "none" | "deps-only" | "full" + default_timeout=60.0, +) + +executor = DenoSandboxExecutor(config) + +async with Session(storage=storage, executor=executor) as session: + result = await session.run("await tools.list()") +``` + +### Security Model: Where Tools Execute + +`DenoSandboxExecutor` sandboxes **Python execution** (the Pyodide runtime) inside a Deno subprocess. However, **tool execution is host-side**: +- If your agent calls `tools.*` while using `DenoSandboxExecutor`, the call is proxied over RPC back to the host Python process, and the tool runs there (using the configured ToolAdapters). +- This means a YAML tool that can read files, run commands, or access the network will do so with **host permissions**, not Deno sandbox permissions. + +Practical guidance: +- If you want "true sandboxed code exec", keep agent code to **pure Python + `deps.*`** (Pyodide `micropip`) and avoid `tools.*`. +- If you attach host tools, treat them as a privileged escape hatch from the sandbox boundary. + +### Network Profiles + +`DenoSandboxConfig.network_profile` controls network access for the Deno subprocess: +- `none`: deny all network access (no runtime dep installs) +- `deps-only`: allow access to PyPI/CDN hosts needed for common `micropip` installs +- `full`: allow all network access + +### Timeout And Reset + +Timeouts are **soft** (the host stops waiting). If an execution times out, the session may be wedged until you call `session.reset()`, which restarts the sandbox. ## Quick Decision Guide @@ -17,20 +71,24 @@ Need stronger isolation? → ContainerExecutor - Filesystem and network isolation - Requires Docker +Want sandboxing without Docker (and can accept Pyodide limitations)? → DenoSandboxExecutor (experimental) + - WASM-based Python runtime + Deno permission model + - Network and filesystem sandboxing via Deno permissions + Need maximum speed AND trust the code completely? 
→ InProcessExecutor - No isolation (runs in your process) - Only for trusted code you control ``` -| Requirement | Subprocess | Container | InProcess | -|-------------|------------|-----------|-----------| -| **Recommended for most users** | **Yes** | | | -| Process isolation | Yes | Yes | No | -| Crash recovery | Yes | Yes | No | -| Container isolation | No | Yes | No | -| No Docker required | Yes | No | Yes | -| Resource limits | Partial | Full | No | -| Untrusted code | No | Yes | No | +| Requirement | Subprocess | Container | DenoSandbox | InProcess | +|-------------|------------|-----------|------------|-----------| +| **Recommended for most users** | **Yes** | | | | +| Process isolation | Yes | Yes | Yes | No | +| Crash recovery | Yes | Yes | Yes | No | +| Container isolation | No | Yes | No | No | +| No Docker required | Yes | No | Yes | Yes | +| Resource limits | Partial | Full | Partial | No | +| Untrusted code | No | Yes | Yes (experimental) | No | --- diff --git a/docs/tools.md b/docs/tools.md index 2597817..c0544d3 100644 --- a/docs/tools.md +++ b/docs/tools.md @@ -8,6 +8,23 @@ Tools wrap external capabilities as callable functions. Three adapter types supp Define command-line tools with YAML schema + recipes. +## Tool Middleware (Experimental) + +py-code-mode supports a host-side middleware chain around tool execution. This is intended for: +- Audit logging and metrics +- Allow/deny decisions and interactive approvals +- Argument rewriting, retries, caching, etc. + +Notes: +- Middleware runs where tools execute (host-side ToolAdapters). +- Enforcement guarantees are strongest with `DenoSandboxExecutor` because sandboxed Python can only access tools via RPC back to the host. + +API surface: +- `ToolMiddleware`: `async def __call__(ctx: ToolCallContext, call_next) -> Any` +- `ToolCallContext`: includes `tool_name`, `callable_name`, `args`, and metadata like `executor_type`, `origin`, `request_id`. + +To enable for `DenoSandboxExecutor`, pass `tool_middlewares` in `DenoSandboxConfig`. + ### Schema Definition ```yaml @@ -89,6 +106,13 @@ recipes: ### Agent Usage +Tool calls inside `Session.run()` are **synchronous** in the default executors (Subprocess/Container/InProcess). + +Notes: +- If you need async tool calls in Python code, use `call_async(...)` explicitly. +- In `DenoSandboxExecutor`, tool calls are **async-first** and you must use `await tools.*`. +- In `DenoSandboxExecutor`, tool calls execute **outside** the sandbox: `await tools.*` is an RPC back to the host Python process, and the tool runs with host permissions (or container permissions if the tool adapter/executor is containerized). + ```python # Recipe invocation (recommended) tools.curl.get(url="https://api.github.com/repos/owner/repo") @@ -103,9 +127,13 @@ tools.curl( ) # Discovery -tools.list() # All tools -tools.search("http") # Search by name/description/tags -tools.curl.list() # Recipes for a specific tool +tools.list() # All tools +tools.search("http") # Search by name/description/tags +tools.curl.list() # Recipes for a specific tool + +# Explicit async (if you need it) +await tools.curl.call_async(url="https://example.com") +await tools.curl.get.call_async(url="https://example.com") ``` ## MCP Tools diff --git a/docs/workflows.md b/docs/workflows.md index b0ca0c5..0857f8c 100644 --- a/docs/workflows.md +++ b/docs/workflows.md @@ -10,13 +10,14 @@ Over time, the workflow library grows. 
Simple workflows become building blocks f ## Creating Workflows -Workflows are async Python functions with an `async def run()` entry point: +Workflows are Python functions with a `run()` entry point. Both `def run(...)` and +`async def run(...)` are supported: ```python # workflows/fetch_json.py """Fetch and parse JSON from a URL.""" -async def run(url: str, headers: dict = None) -> dict: +def run(url: str, headers: dict = None) -> dict: """Fetch JSON data from a URL. Args: @@ -37,7 +38,7 @@ async def run(url: str, headers: dict = None) -> dict: raise RuntimeError(f"Invalid JSON from {url}: {e}") from e ``` -> **Note:** All workflows must use `async def run()`. Synchronous `def run()` is not supported. +> **Note:** If your workflow uses `async def run(...)`, it can still call tools/workflows/artifacts synchronously. ### Runtime Creation @@ -46,7 +47,7 @@ Agents can create workflows dynamically: ```python workflows.create( name="fetch_json", - source='''async def run(url: str) -> dict: + source='''def run(url: str) -> dict: """Fetch and parse JSON from a URL.""" import json response = tools.curl.get(url=url) @@ -96,7 +97,7 @@ Workflows can invoke other workflows, enabling layered workflows: ```python # workflows/fetch_json.py -async def run(url: str) -> dict: +def run(url: str) -> dict: """Fetch and parse JSON from a URL.""" import json response = tools.curl.get(url=url) @@ -107,11 +108,13 @@ async def run(url: str) -> dict: ```python # workflows/get_repo_metadata.py -async def run(owner: str, repo: str) -> dict: +def run(owner: str, repo: str) -> dict: """Get GitHub repository metadata.""" # Uses the fetch_json workflow - data = workflows.invoke("fetch_json", - url=f"https://api.github.com/repos/{owner}/{repo}") + data = workflows.invoke( + "fetch_json", + url=f"https://api.github.com/repos/{owner}/{repo}", + ) return { "name": data["name"], @@ -125,7 +128,7 @@ async def run(owner: str, repo: str) -> dict: ```python # workflows/analyze_multiple_repos.py -async def run(repos: list) -> dict: +def run(repos: list) -> dict: """Analyze multiple GitHub repositories.""" summaries = [] for repo in repos: diff --git a/examples/deno-sandbox/.gitignore b/examples/deno-sandbox/.gitignore new file mode 100644 index 0000000..cc2f05a --- /dev/null +++ b/examples/deno-sandbox/.gitignore @@ -0,0 +1,5 @@ +data/ +.deno-cache/ +__pycache__/ +.pytest_cache/ + diff --git a/examples/deno-sandbox/README.md b/examples/deno-sandbox/README.md new file mode 100644 index 0000000..ae37461 --- /dev/null +++ b/examples/deno-sandbox/README.md @@ -0,0 +1,36 @@ +# DenoSandboxExecutor Example + +Demonstrates sandboxed Python execution using `DenoSandboxExecutor` (Deno + Pyodide). + +## What Is DenoSandboxExecutor? + +`DenoSandboxExecutor` runs Python in **Pyodide (WASM)** inside a **Deno** subprocess and uses Deno permissions to sandbox the Python runtime. + +Important: **tools execute host-side**. Any `tools.*` call is sent over RPC to the host Python process and executed by ToolAdapters with host permissions. + +## Prerequisites + +- Python 3.12+ +- Deno installed and on PATH + +## Setup + +```bash +cd examples/deno-sandbox +uv sync +``` + +## Run + +```bash +uv run python example.py +``` + +## Notes + +- In `DenoSandboxExecutor`, namespace calls are async-first: use `await tools.*`, `await artifacts.*`, `await workflows.*`, `await deps.*`. 
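+  For example, inside `session.run(...)`: `result = await tools.echo.say(message="hi")`
+  (the `echo` tool is the example host-side tool defined in `tools/echo.yaml`).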
+- `DenoSandboxConfig.network_profile` controls *sandbox* network access: + - `none`: deny sandbox network (no runtime `micropip` installs) + - `deps-only`: allow typical PyPI/CDN hosts for `micropip` + - `full`: allow all sandbox network + diff --git a/examples/deno-sandbox/example.py b/examples/deno-sandbox/example.py new file mode 100644 index 0000000..1180993 --- /dev/null +++ b/examples/deno-sandbox/example.py @@ -0,0 +1,71 @@ +#!/usr/bin/env python3 +"""DenoSandboxExecutor example - Deno + Pyodide (WASM) sandbox. + +Highlights: +- Python code executes inside Pyodide (WASM) within a Deno subprocess. +- In DenoSandboxExecutor, namespace calls are async-first: + - use `await tools.*`, `await artifacts.*`, `await workflows.*`, `await deps.*` +- Tool execution is host-side: `tools.*` calls are RPC'd back to the host and + executed by ToolAdapters with host permissions. +""" + +from __future__ import annotations + +import asyncio +import shutil +from pathlib import Path + +from py_code_mode import FileStorage, Session +from py_code_mode.execution import DenoSandboxConfig, DenoSandboxExecutor + +HERE = Path(__file__).resolve().parent + + +async def main() -> None: + if shutil.which("deno") is None: + raise SystemExit( + "deno not found on PATH. Install Deno to run this example: https://deno.com/" + ) + + storage = FileStorage(base_path=HERE / "data") + deno_dir = HERE / ".deno-cache" + tools_dir = HERE / "tools" + + config = DenoSandboxConfig( + tools_path=tools_dir, + deno_dir=deno_dir, + # Start with no sandbox network access. (Tools still run host-side.) + network_profile="none", + default_timeout=60.0, + ipc_timeout=120.0, + ) + executor = DenoSandboxExecutor(config) + + async with Session(storage=storage, executor=executor) as session: + print("Basic execution (sandboxed Python)...") + r = await session.run("1 + 1") + print(" 1 + 1 =", r.value) + + print("\nTool call (HOST-SIDE, via RPC)...") + r = await session.run("(await tools.echo.say(message='hello from host tool')).strip()") + print(" tools.echo.say ->", r.value) + + print("\nArtifacts (stored via host storage backend)...") + await session.run("await artifacts.save('hello.txt', 'hi', description='demo')") + r = await session.run("await artifacts.load('hello.txt')") + print(" artifacts.load('hello.txt') ->", r.value) + + print("\nWorkflows (stored in host storage; executed in sandbox)...") + src = "async def run(x: int) -> int:\\n return x * 2\\n" + await session.run(f"await workflows.create('double', {src!r}, description='Multiply by 2')") + r = await session.run("await workflows.invoke(workflow_name='double', x=21)") + print(" workflows.invoke('double', x=21) ->", r.value) + + print("\nStdout capture...") + r = await session.run('print("hello from sandbox stdout")\\n"done"') + print(" value:", r.value) + print(" stdout:", r.stdout.strip()) + + +if __name__ == "__main__": + asyncio.run(main()) diff --git a/examples/deno-sandbox/pyproject.toml b/examples/deno-sandbox/pyproject.toml new file mode 100644 index 0000000..ec09701 --- /dev/null +++ b/examples/deno-sandbox/pyproject.toml @@ -0,0 +1,15 @@ +[project] +name = "py-code-mode-deno-sandbox-example" +version = "0.1.0" +description = "DenoSandboxExecutor example using Deno + Pyodide sandbox" +requires-python = ">=3.12" +dependencies = [ + "py-code-mode", +] + +[tool.uv] +dev-dependencies = [] + +[tool.uv.sources] +py-code-mode = { path = "../..", editable = true } + diff --git a/examples/deno-sandbox/tools/echo.yaml b/examples/deno-sandbox/tools/echo.yaml new file mode 100644 
index 0000000..85a44cb --- /dev/null +++ b/examples/deno-sandbox/tools/echo.yaml @@ -0,0 +1,18 @@ +name: echo +description: Echo text (host-side tool; executed outside the Deno sandbox) +command: /bin/echo +timeout: 5 + +schema: + positional: + - name: message + type: string + required: true + description: Message to echo + +recipes: + say: + description: Echo the message + params: + message: {} + diff --git a/pyproject.toml b/pyproject.toml index eacc782..b55b556 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -98,6 +98,14 @@ python_files = ["test_*.py"] python_classes = ["Test*"] python_functions = ["test_*"] addopts = "-n auto --dist loadgroup" +markers = [ + "slow: Long-running tests (often subprocess/docker integration).", + "integration: Integration tests that may require external services (e.g. Redis).", + "docker: Tests that require Docker (typically xdist_group('docker')).", + "subprocess: Tests that use the SubprocessExecutor / kernel subprocess (typically xdist_group('subprocess')).", + "venv: Tests that touch venv caching/management (typically xdist_group('venv')).", + "deno: Tests that require Deno (DenoSandboxExecutor integration).", +] [tool.ruff] target-version = "py312" diff --git a/src/py_code_mode/artifacts/__init__.py b/src/py_code_mode/artifacts/__init__.py index 1240bad..79e4454 100644 --- a/src/py_code_mode/artifacts/__init__.py +++ b/src/py_code_mode/artifacts/__init__.py @@ -5,11 +5,13 @@ ArtifactStoreProtocol, ) from py_code_mode.artifacts.file import FileArtifactStore +from py_code_mode.artifacts.namespace import ArtifactsNamespace from py_code_mode.artifacts.redis import RedisArtifactStore __all__ = [ "Artifact", "ArtifactStoreProtocol", "FileArtifactStore", + "ArtifactsNamespace", "RedisArtifactStore", ] diff --git a/src/py_code_mode/artifacts/namespace.py b/src/py_code_mode/artifacts/namespace.py new file mode 100644 index 0000000..6fb85a1 --- /dev/null +++ b/src/py_code_mode/artifacts/namespace.py @@ -0,0 +1,57 @@ +"""ArtifactsNamespace - agent-facing API for artifact storage.""" + +from __future__ import annotations + +from typing import TYPE_CHECKING, Any + +if TYPE_CHECKING: + from py_code_mode.artifacts.base import ArtifactStoreProtocol + + +class ArtifactsNamespace: + """Agent-facing namespace for artifacts. + + Provides: + - artifacts.save(name, data, description="", metadata=None) + - artifacts.load(name) + - artifacts.list() + - artifacts.exists(name) + - artifacts.get(name) + - artifacts.delete(name) + + This wrapper intentionally exposes a subset of the underlying store API to + keep the sandbox surface stable. + """ + + def __init__(self, store: ArtifactStoreProtocol) -> None: + self._store = store + + @property + def path(self) -> Any: + # Keep compatibility with FileArtifactStore.path. 
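+        # Stores without a filesystem location (e.g. RedisArtifactStore) may not
+        # define `.path`; in that case this property resolves to None.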
+ return getattr(self._store, "path", None) + + def save( + self, + name: str, + data: Any, + description: str = "", + metadata: dict[str, Any] | None = None, + ) -> Any: + return self._store.save(name, data, description=description, metadata=metadata) + + def load(self, name: str) -> Any: + return self._store.load(name) + + def list(self) -> Any: + return self._store.list() + + def exists(self, name: str) -> Any: + return bool(self._store.exists(name)) + + def get(self, name: str) -> Any: + return self._store.get(name) + + def delete(self, name: str) -> Any: + self._store.delete(name) + return None diff --git a/src/py_code_mode/deps/async_namespace.py b/src/py_code_mode/deps/async_namespace.py new file mode 100644 index 0000000..d357624 --- /dev/null +++ b/src/py_code_mode/deps/async_namespace.py @@ -0,0 +1,65 @@ +"""Deprecated: async-capable wrapper for deps namespace. + +Kept for potential future use. The primary agent-facing API is synchronous. +""" + +from __future__ import annotations + +import asyncio +from typing import Any + +from py_code_mode.deps.namespace import DepsNamespace + + +def _in_async_context() -> bool: + try: + asyncio.get_running_loop() + except RuntimeError: + return False + return True + + +class AsyncDepsNamespace: + """Wrapper around DepsNamespace providing optional await support.""" + + def __init__(self, wrapped: DepsNamespace) -> None: + self._wrapped = wrapped + + def add(self, package: str) -> Any: + if _in_async_context(): + + async def _coro() -> Any: + return self._wrapped.add(package) + + return _coro() + return self._wrapped.add(package) + + def list(self) -> Any: + if _in_async_context(): + + async def _coro() -> list[str]: + return self._wrapped.list() + + return _coro() + return self._wrapped.list() + + def remove(self, package: str) -> Any: + if _in_async_context(): + + async def _coro() -> bool: + return self._wrapped.remove(package) + + return _coro() + return self._wrapped.remove(package) + + def sync(self) -> Any: + if _in_async_context(): + + async def _coro() -> Any: + return self._wrapped.sync() + + return _coro() + return self._wrapped.sync() + + def __repr__(self) -> str: + return repr(self._wrapped) diff --git a/src/py_code_mode/execution/__init__.py b/src/py_code_mode/execution/__init__.py index 0eae687..b2ed079 100644 --- a/src/py_code_mode/execution/__init__.py +++ b/src/py_code_mode/execution/__init__.py @@ -35,6 +35,16 @@ SubprocessConfig = None # type: ignore SubprocessExecutor = None # type: ignore +# Deno sandbox is optional at runtime (requires deno + pyodide assets). +try: + from py_code_mode.execution.deno_sandbox import DenoSandboxConfig, DenoSandboxExecutor + + DENO_SANDBOX_AVAILABLE = True +except Exception: + DENO_SANDBOX_AVAILABLE = False + DenoSandboxConfig = None # type: ignore + DenoSandboxExecutor = None # type: ignore + __all__ = [ "Capability", "Executor", @@ -52,4 +62,7 @@ "SubprocessExecutor", "SubprocessConfig", "SUBPROCESS_AVAILABLE", + "DenoSandboxExecutor", + "DenoSandboxConfig", + "DENO_SANDBOX_AVAILABLE", ] diff --git a/src/py_code_mode/execution/deno_sandbox/__init__.py b/src/py_code_mode/execution/deno_sandbox/__init__.py new file mode 100644 index 0000000..c3d1e15 --- /dev/null +++ b/src/py_code_mode/execution/deno_sandbox/__init__.py @@ -0,0 +1,10 @@ +"""Deno sandbox execution backend. + +This backend runs Python inside Pyodide (WASM) hosted by a Deno subprocess. +It is intended to provide a sandboxed runtime without requiring Docker. 
+""" + +from py_code_mode.execution.deno_sandbox.config import DenoSandboxConfig +from py_code_mode.execution.deno_sandbox.executor import DenoSandboxExecutor + +__all__ = ["DenoSandboxConfig", "DenoSandboxExecutor"] diff --git a/src/py_code_mode/execution/deno_sandbox/config.py b/src/py_code_mode/execution/deno_sandbox/config.py new file mode 100644 index 0000000..c0bc5a3 --- /dev/null +++ b/src/py_code_mode/execution/deno_sandbox/config.py @@ -0,0 +1,55 @@ +"""Configuration for DenoSandboxExecutor.""" + +from __future__ import annotations + +from dataclasses import dataclass +from pathlib import Path +from typing import Literal + +from py_code_mode.tools.middleware import ToolMiddleware + + +@dataclass(frozen=True) +class DenoSandboxConfig: + """Configuration for DenoSandboxExecutor. + + Notes: + - This executor expects Pyodide runtime assets (WASM + stdlib files) to be + present on disk and readable by the Deno subprocess. + - Dependency installs are best-effort via Pyodide; many wheels will not work. + """ + + default_timeout: float | None = 60.0 + allow_runtime_deps: bool = True + tools_path: Path | None = None + deps: tuple[str, ...] | None = None + deps_file: Path | None = None + ipc_timeout: float = 30.0 + deps_timeout: float | None = 300.0 + + deno_executable: str = "deno" + # If None, the executor uses the packaged runner script adjacent to this module. + runner_path: Path | None = None + + # Directory used for Deno's module/npm cache (DENO_DIR). If None, a default + # per-user cache directory is used. This cache is prepared outside the + # sandbox (host) via `deno cache`, then the sandbox runs with --cached-only. + deno_dir: Path | None = None + + # Network profile: + # - "none": deny all network access (no runtime dep installs) + # - "deps-only": allow just enough for micropip / pyodide package fetches + # - "full": allow all network access + network_profile: Literal["none", "deps-only", "full"] = "full" + + # Used when network_profile="deps-only". + deps_net_allowlist: tuple[str, ...] = ( + "pypi.org", + "files.pythonhosted.org", + "cdn.jsdelivr.net", + ) + + # Optional host-side middleware invoked around tool calls. + # This is enforced for DenoSandbox tool calls because all `tools.*` calls + # are proxied back to the host Python process. + tool_middlewares: tuple[ToolMiddleware, ...] = () diff --git a/src/py_code_mode/execution/deno_sandbox/executor.py b/src/py_code_mode/execution/deno_sandbox/executor.py new file mode 100644 index 0000000..1de2cab --- /dev/null +++ b/src/py_code_mode/execution/deno_sandbox/executor.py @@ -0,0 +1,618 @@ +"""Deno + Pyodide execution backend. + +This executor runs Python inside Pyodide (WASM) in a Deno subprocess. + +It uses an NDJSON IPC protocol and a host-side provider to service sandbox +namespace proxy operations (tools/workflows/artifacts/deps persistence). 
+""" + +from __future__ import annotations + +import asyncio +import json +import logging +import os +import shutil +import uuid +from dataclasses import dataclass +from pathlib import Path +from typing import TYPE_CHECKING, Any + +from py_code_mode.deps import ( + FileDepsStore, + MemoryDepsStore, + RuntimeDepsDisabledError, + collect_configured_deps, +) +from py_code_mode.deps.store import DepsStore +from py_code_mode.execution.deno_sandbox.config import DenoSandboxConfig +from py_code_mode.execution.protocol import Capability, validate_storage_not_access +from py_code_mode.execution.registry import register_backend +from py_code_mode.execution.resource_provider import StorageResourceProvider +from py_code_mode.tools import ToolRegistry, load_tools_from_path +from py_code_mode.types import ExecutionResult + +if TYPE_CHECKING: + from asyncio.subprocess import Process + + from py_code_mode.storage.backends import StorageBackend + +logger = logging.getLogger(__name__) + + +@dataclass(frozen=True) +class _Pending: + fut: asyncio.Future[dict[str, Any]] + + +class DenoSandboxExecutor: + """Execute code in Pyodide hosted by Deno. + + Capabilities: + - TIMEOUT: Yes (soft timeout in host wait; does not interrupt sandbox run) + - PROCESS_ISOLATION: Yes (Deno subprocess) + - NETWORK_ISOLATION: Yes (Deno permissions; default deny) + - FILESYSTEM_ISOLATION: Partial (Deno permissions; allow-read to Pyodide assets) + - RESET: Yes (restart Deno subprocess) + - DEPS_INSTALL / DEPS_UNINSTALL: Best-effort (Pyodide/micropip) + """ + + _CAPABILITIES = frozenset( + { + Capability.TIMEOUT, + Capability.PROCESS_ISOLATION, + Capability.NETWORK_ISOLATION, + Capability.NETWORK_FILTERING, + Capability.FILESYSTEM_ISOLATION, + Capability.RESET, + Capability.DEPS_INSTALL, + Capability.DEPS_UNINSTALL, + } + ) + + def __init__(self, config: DenoSandboxConfig | None = None) -> None: + self._config = config or DenoSandboxConfig() + self._proc: Process | None = None + self._stdout_task: asyncio.Task[None] | None = None + self._stderr_task: asyncio.Task[None] | None = None + self._pending: dict[str, _Pending] = {} + self._closed = False + self._wedged = False # indicates a soft-timeout run may still be executing + self._deno_dir: Path | None = None + + self._storage: StorageBackend | None = None + self._provider: StorageResourceProvider | None = None + self._tool_registry: ToolRegistry | None = None + self._deps_store: DepsStore | None = None + + def supports(self, capability: str) -> bool: + return capability in self._CAPABILITIES + + def supported_capabilities(self) -> set[str]: + return set(self._CAPABILITIES) + + def get_configured_deps(self) -> list[str]: + return collect_configured_deps(self._config.deps, self._config.deps_file) + + async def __aenter__(self) -> DenoSandboxExecutor: + return self + + async def __aexit__(self, exc_type: Any, exc_val: Any, exc_tb: Any) -> None: + await self.close() + + async def start(self, storage: StorageBackend | None = None) -> None: + validate_storage_not_access(storage, "DenoSandboxExecutor") + if self._proc is not None: + return + + if shutil.which(self._config.deno_executable) is None: + raise RuntimeError(f"deno not found: {self._config.deno_executable!r}") + + self._storage = storage + self._deno_dir = (self._config.deno_dir or self._default_deno_dir()).expanduser().resolve() + self._deno_dir.mkdir(parents=True, exist_ok=True) + + # Tools from executor config + if self._config.tools_path is not None: + self._tool_registry = await load_tools_from_path(self._config.tools_path) + 
else: + self._tool_registry = ToolRegistry() + if self._config.tool_middlewares: + self._tool_registry.apply_tool_middlewares( + self._config.tool_middlewares, + executor_type="deno-sandbox", + origin="deno-sandbox", + ) + + # Deps store from executor config (persistence only; installs happen in sandbox) + initial_deps = collect_configured_deps(self._config.deps, self._config.deps_file) + if self._config.deps_file: + self._deps_store = FileDepsStore(self._config.deps_file.parent) + for dep in initial_deps: + if not self._deps_store.exists(dep): + self._deps_store.add(dep) + else: + self._deps_store = MemoryDepsStore() + for dep in initial_deps: + self._deps_store.add(dep) + + if storage is not None: + self._provider = StorageResourceProvider( + storage=storage, + tool_registry=self._tool_registry, + deps_store=self._deps_store, + allow_runtime_deps=self._config.allow_runtime_deps, + ) + + await self._ensure_deno_cache() + await self._spawn_runner() + + def _default_deno_dir(self) -> Path: + return Path.home() / ".cache" / "py-code-mode" / "deno-sandbox" + + async def _ensure_deno_cache(self) -> None: + """Cache runner modules + npm:pyodide outside the sandbox.""" + runner_path = self._config.runner_path or ( + Path(__file__).resolve().parent / "runner" / "main.ts" + ) + worker_path = runner_path.parent / "worker.ts" + deno_dir = self._deno_dir + assert deno_dir is not None + + cmd = [ + self._config.deno_executable, + "cache", + "--quiet", + "--no-check", + str(runner_path), + str(worker_path), + ] + proc = await asyncio.create_subprocess_exec( + *cmd, + env={**os.environ, "DENO_DIR": str(deno_dir)}, + stdout=asyncio.subprocess.PIPE, + stderr=asyncio.subprocess.PIPE, + ) + _out, err = await proc.communicate() + if proc.returncode != 0: + raise RuntimeError(f"deno cache failed: {err.decode('utf-8', errors='replace')}") + + async def _spawn_runner(self) -> None: + runner_path = self._config.runner_path or ( + Path(__file__).resolve().parent / "runner" / "main.ts" + ) + runner_dir = runner_path.parent.resolve() + deno_dir = self._deno_dir + assert deno_dir is not None + + # Sandbox defaults: cached-only + deny-net. + allow_reads = [runner_dir, deno_dir] + + deno_args: list[str] = [ + self._config.deno_executable, + "run", + "--quiet", + "--no-check", + "--no-prompt", + "--cached-only", + "--location=https://pyodide.invalid/", + "--deny-env", + "--deny-run", + ] + # Pyodide caches wheels into the Deno npm cache under DENO_DIR. + # Allow writes only to that cache directory. + deno_args.append(f"--allow-write={deno_dir}") + profile = self._config.network_profile + if profile == "full": + deno_args.append("--allow-net") + elif profile == "deps-only": + allow = ",".join(self._config.deps_net_allowlist) + deno_args.append(f"--allow-net={allow}") + elif profile == "none": + deno_args.append("--deny-net") + else: + raise ValueError(f"unknown network_profile: {profile!r}") + + deno_args.append(f"--allow-read={','.join(str(p) for p in allow_reads)}") + deno_args.append(str(runner_path)) + + self._proc = await asyncio.create_subprocess_exec( + *deno_args, + stdin=asyncio.subprocess.PIPE, + stdout=asyncio.subprocess.PIPE, + stderr=asyncio.subprocess.PIPE, + env={**os.environ, "DENO_DIR": str(deno_dir)}, + ) + + assert self._proc.stdin is not None + assert self._proc.stdout is not None + + self._stdout_task = asyncio.create_task(self._stdout_loop()) + self._stderr_task = asyncio.create_task(self._stderr_loop()) + + # Initialize runner with runtime directory and wait for ready. 
+ init_id = uuid.uuid4().hex + ready = await self._request( + { + "id": init_id, + "type": "init", + }, + timeout=self._config.ipc_timeout, + ) + if ready.get("type") != "ready": + raise RuntimeError(f"Runner init failed: {ready!r}") + + self._wedged = False + + async def _stdout_loop(self) -> None: + assert self._proc is not None and self._proc.stdout is not None + reader = self._proc.stdout + while True: + line = await reader.readline() + if not line: + return + try: + msg = json.loads(line.decode("utf-8", errors="replace")) + except Exception: + continue + if not isinstance(msg, dict): + continue + + msg_type = msg.get("type") + msg_id = msg.get("id") + + if msg_type == "rpc_request": + await self._handle_rpc_request(msg) + continue + + if isinstance(msg_id, str) and msg_id in self._pending: + pending = self._pending.pop(msg_id) + if not pending.fut.done(): + pending.fut.set_result(msg) + + async def _stderr_loop(self) -> None: + assert self._proc is not None and self._proc.stderr is not None + reader = self._proc.stderr + while True: + line = await reader.readline() + if not line: + return + # Keep stderr drained to avoid deadlocks; log at debug to aid diagnosis. + logger.debug("deno stderr: %s", line.decode("utf-8", errors="replace").rstrip()) + + async def _deps_install(self, packages: list[str]) -> dict[str, Any]: + if not packages: + return {"installed": [], "already_present": [], "failed": []} + if self._proc is None: + await self.start(storage=self._storage) + + req_id = uuid.uuid4().hex + timeout = self._config.deps_timeout + res = await self._request( + {"id": req_id, "type": "deps_install", "packages": list(packages)}, + timeout=timeout, + ) + if res.get("type") != "deps_install_result": + return { + "installed": [], + "already_present": [], + "failed": [f"Unexpected runner response: {res!r}"], + } + return { + "installed": list(res.get("installed") or []), + "already_present": list(res.get("already_present") or []), + "failed": list(res.get("failed") or []), + } + + async def _handle_rpc_request(self, msg: dict[str, Any]) -> None: + if self._proc is None or self._proc.stdin is None: + return + + req_id = msg.get("id") + namespace = msg.get("namespace") + op = msg.get("op") + # Runner forwards rpc_request from the Pyodide worker. New protocol uses + # args_json (string) to avoid structured clone issues with Python proxy + # objects. Keep backwards-compat with args (dict) for older runners. 
+ args: dict[str, Any] + if "args_json" in msg: + raw = msg.get("args_json") + if not isinstance(raw, str): + raw = "{}" + try: + parsed = json.loads(raw) + except Exception: + parsed = {} + if parsed is None: + args = {} + elif isinstance(parsed, dict): + args = parsed + else: + args = {} + else: + raw_args = msg.get("args") or {} + args = raw_args if isinstance(raw_args, dict) else {} + + if not isinstance(req_id, str) or not isinstance(namespace, str) or not isinstance(op, str): + await self._send( + { + "id": str(req_id), + "type": "rpc_response", + "ok": False, + "error": "bad rpc request", + } + ) + return + + try: + result = await self._dispatch_rpc(namespace, op, args) + await self._send({"id": req_id, "type": "rpc_response", "ok": True, "result": result}) + except Exception as e: + await self._send( + { + "id": req_id, + "type": "rpc_response", + "ok": False, + "error": {"type": type(e).__name__, "message": str(e)}, + } + ) + + async def _dispatch_rpc(self, namespace: str, op: str, args: dict[str, Any]) -> Any: + if namespace in ("tools", "workflows", "artifacts"): + if self._provider is None: + raise RuntimeError("No storage/provider configured") + + if namespace == "tools": + if op == "list_tools": + return await self._provider.list_tools() + if op == "search_tools": + return await self._provider.search_tools(args["query"], int(args.get("limit", 10))) + if op == "list_tool_recipes": + return await self._provider.list_tool_recipes(args["name"]) + if op == "call_tool": + return await self._provider.call_tool(args["name"], args.get("args") or {}) + raise ValueError(f"unknown tools op: {op}") + + if namespace == "workflows": + if op == "list_workflows": + return await self._provider.list_workflows() + if op == "search_workflows": + return await self._provider.search_workflows( + args["query"], int(args.get("limit", 5)) + ) + if op == "get_workflow": + return await self._provider.get_workflow(args["name"]) + if op == "create_workflow": + return await self._provider.create_workflow( + args["name"], args["source"], args.get("description", "") + ) + if op == "delete_workflow": + return await self._provider.delete_workflow(args["name"]) + raise ValueError(f"unknown workflows op: {op}") + + if namespace == "artifacts": + if op == "list_artifacts": + return await self._provider.list_artifacts() + if op == "get_artifact": + return await self._provider.get_artifact(args["name"]) + if op == "artifact_exists": + return await self._provider.artifact_exists(args["name"]) + if op == "load_artifact": + return await self._provider.load_artifact(args["name"]) + if op == "save_artifact": + return await self._provider.save_artifact( + args["name"], args.get("data"), args.get("description", "") + ) + if op == "delete_artifact": + await self._provider.delete_artifact(args["name"]) + return None + raise ValueError(f"unknown artifacts op: {op}") + + if namespace == "deps": + # Persistence only; sandbox performs actual installs best-effort. + if self._deps_store is None: + return [] if op == "list_deps" else False + + if op == "list_deps": + return self._deps_store.list() + + if op == "persist_add": + if not self._config.allow_runtime_deps: + raise RuntimeDepsDisabledError( + "Runtime dependency installation is disabled. " + "Dependencies must be pre-configured before session start." + ) + spec = args["spec"] + self._deps_store.add(spec) + return True + + if op == "persist_remove": + if not self._config.allow_runtime_deps: + raise RuntimeDepsDisabledError( + "Runtime dependency modification is disabled. 
" + "Dependencies must be pre-configured before session start." + ) + name = args["spec_or_name"] + return self._deps_store.remove(name) + + raise ValueError(f"unknown deps op: {op}") + + raise ValueError(f"unknown rpc namespace: {namespace}") + + async def _send(self, msg: dict[str, Any]) -> None: + if self._proc is None or self._proc.stdin is None: + raise RuntimeError("Runner not started") + data = (json.dumps(msg, ensure_ascii=True) + "\n").encode("utf-8") + self._proc.stdin.write(data) + await self._proc.stdin.drain() + + async def _request(self, msg: dict[str, Any], timeout: float | None) -> dict[str, Any]: + req_id = msg.get("id") + if not isinstance(req_id, str): + raise TypeError("request message must include string id") + fut: asyncio.Future[dict[str, Any]] = asyncio.get_running_loop().create_future() + self._pending[req_id] = _Pending(fut=fut) + await self._send(msg) + + if timeout is None: + return await fut + return await asyncio.wait_for(fut, timeout=timeout) + + async def run(self, code: str, timeout: float | None = None) -> ExecutionResult: + if self._closed: + return ExecutionResult(value=None, stdout="", error="Executor is closed") + if self._proc is None: + await self.start(storage=self._storage) + + if self._wedged: + return ExecutionResult( + value=None, + stdout="", + error=( + "Previous execution timed out; sandbox may still be running. " + "Call session.reset()." + ), + ) + + effective_timeout = timeout if timeout is not None else self._config.default_timeout + req_id = uuid.uuid4().hex + + try: + res = await self._request( + {"id": req_id, "type": "exec", "code": code}, + timeout=effective_timeout, + ) + except TimeoutError: + self._wedged = True + return ExecutionResult( + value=None, + stdout="", + error=( + f"Execution timeout after {effective_timeout} seconds " + "(soft timeout; state preserved if it finishes)." + ), + ) + + if res.get("type") != "exec_result": + return ExecutionResult( + value=None, stdout="", error=f"Unexpected runner response: {res!r}" + ) + + return ExecutionResult( + value=res.get("value"), + stdout=res.get("stdout") or "", + error=res.get("error"), + ) + + async def reset(self) -> None: + # Hard reset: restart the Deno subprocess to guarantee recovery. 
+ await self._restart() + + async def _restart(self) -> None: + await self.close() + self._closed = False + self._proc = None + self._stdout_task = None + self._pending.clear() + self._wedged = False + await self.start(storage=self._storage) + + async def close(self) -> None: + if self._proc is not None: + try: + await self._send({"id": uuid.uuid4().hex, "type": "close"}) + except Exception: + pass + try: + self._proc.terminate() + except ProcessLookupError: + pass + try: + await asyncio.wait_for(self._proc.wait(), timeout=2.0) + except Exception: + pass + if self._stdout_task is not None: + self._stdout_task.cancel() + if self._stderr_task is not None: + self._stderr_task.cancel() + if self._tool_registry is not None: + await self._tool_registry.close() + self._proc = None + self._stdout_task = None + self._stderr_task = None + self._closed = True + self._pending.clear() + self._wedged = False + + # ------------------------------------------------------------------------- + # Tools facade (host-side) + # ------------------------------------------------------------------------- + + async def list_tools(self) -> list[dict[str, Any]]: + if self._tool_registry is None: + return [] + return [tool.to_dict() for tool in self._tool_registry.list_tools()] + + async def search_tools(self, query: str, limit: int = 10) -> list[dict[str, Any]]: + if self._tool_registry is None: + return [] + return [tool.to_dict() for tool in self._tool_registry.search(query, limit=limit)] + + # ------------------------------------------------------------------------- + # Deps facade (host persistence + sandbox best-effort install via exec) + # ------------------------------------------------------------------------- + + async def install_deps(self, packages: list[str]) -> dict[str, Any]: + # System-level API (used by Session._sync_deps()). + return await self._deps_install(packages) + + async def uninstall_deps(self, packages: list[str]) -> dict[str, Any]: + # Pyodide does not reliably support uninstall. We treat this as config removal only. + removed: list[str] = [] + failed: list[str] = [] + for pkg in packages: + try: + await self.remove_dep(pkg) + removed.append(pkg) + except Exception: + failed.append(pkg) + return {"removed": removed, "not_found": [], "failed": failed} + + async def add_dep(self, package: str) -> dict[str, Any]: + if not self._config.allow_runtime_deps: + raise RuntimeDepsDisabledError( + "Runtime dependency installation is disabled. " + "Dependencies must be pre-configured before session start." + ) + if self._deps_store is not None: + self._deps_store.add(package) + return await self._deps_install([package]) + + async def remove_dep(self, package: str) -> dict[str, Any]: + if not self._config.allow_runtime_deps: + raise RuntimeDepsDisabledError( + "Runtime dependency modification is disabled. " + "Dependencies must be pre-configured before session start." 
+ ) + removed_from_config = False + if self._deps_store is not None: + removed_from_config = self._deps_store.remove(package) + return { + "removed": [package] if removed_from_config else [], + "not_found": [] if removed_from_config else [package], + "failed": [], + "removed_from_config": removed_from_config, + } + + async def list_deps(self) -> list[str]: + if self._deps_store is None: + return [] + return self._deps_store.list() + + async def sync_deps(self) -> dict[str, Any]: + if self._deps_store is None: + return {"installed": [], "already_present": [], "failed": []} + return await self._deps_install(self._deps_store.list()) + + +register_backend("deno-sandbox", DenoSandboxExecutor) diff --git a/src/py_code_mode/execution/deno_sandbox/runner/main.ts b/src/py_code_mode/execution/deno_sandbox/runner/main.ts new file mode 100644 index 0000000..4e53bf4 --- /dev/null +++ b/src/py_code_mode/execution/deno_sandbox/runner/main.ts @@ -0,0 +1,314 @@ +// NDJSON protocol runner: host (Python) <-> Deno main <-> Pyodide worker. +// +// This is dependency-light. The only external dependency should come from +// worker.ts (npm:pyodide). We rely on `deno cache` being run outside the +// sandbox so the sandboxed runner can use `--cached-only` and `--deny-net`. + +type Req = + | { id: string; type: "init" } + | { id: string; type: "exec"; code: string } + | { id: string; type: "deps_install"; packages: string[] } + | { id: string; type: "reset" } + | { id: string; type: "close" } + | { + id: string; + type: "rpc_response"; + ok: boolean; + result?: unknown; + error?: unknown; + }; + +type Resp = + | { id: string; type: "ready" } + | { + id: string; + type: "exec_result"; + stdout: string; + value: unknown; + error: string | null; + } + | { + id: string; + type: "deps_install_result"; + installed: string[]; + already_present: string[]; + failed: string[]; + } + | { + id: string; + type: "rpc_request"; + namespace: string; + op: string; + args_json: string; + } + | { id: string; type: "error"; message: string }; + +function writeMsg(msg: Resp) { + Deno.stdout.writeSync(new TextEncoder().encode(JSON.stringify(msg) + "\n")); +} + +async function* readNdjsonLines(): AsyncGenerator { + const decoder = new TextDecoder(); + let buf = ""; + for await (const chunk of Deno.stdin.readable) { + buf += decoder.decode(chunk, { stream: true }); + while (true) { + const idx = buf.indexOf("\n"); + if (idx < 0) break; + const line = buf.slice(0, idx); + buf = buf.slice(idx + 1); + yield line; + } + } + if (buf) yield buf; +} + +function newWorker(): Worker { + const worker = new Worker(new URL("./worker.ts", import.meta.url), { + type: "module", + deno: { namespace: true }, + }); + worker.postMessage({ + type: "boot", + }); + return worker; +} + +let worker: Worker | null = null; +let workerBootError: string | null = null; +let workerReady = false; +let bootWait: Promise | null = null; +let bootResolve: (() => void) | null = null; +let bootReject: ((e: unknown) => void) | null = null; + +const execPending = new Map< + string, + { resolve: (v: any) => void; reject: (e: any) => void } +>(); + +function ensureWorker() { + if (!worker) worker = newWorker(); +} + +function resetWorker() { + if (worker) worker.terminate(); + worker = newWorker(); + workerBootError = null; + workerReady = false; + bootWait = new Promise((resolve, reject) => { + bootResolve = resolve; + bootReject = reject; + }); +} + +function callExec(id: string, code: string): Promise { + ensureWorker(); + return new Promise((resolve, reject) => { + if 
(workerBootError) return reject(new Error(workerBootError)); + execPending.set(id, { resolve, reject }); + worker!.postMessage({ type: "exec", id, code }); + }); +} + +function callDepsInstall(id: string, packages: string[]): Promise { + ensureWorker(); + return new Promise((resolve, reject) => { + if (workerBootError) return reject(new Error(workerBootError)); + execPending.set(id, { resolve, reject }); + worker!.postMessage({ type: "deps_install", id, packages }); + }); +} + +function attachWorkerHandler() { + if (!worker) return; + worker.onmessage = (ev: MessageEvent) => { + const msg = ev.data; + if (!msg || typeof msg !== "object") return; + + if (msg.type === "boot_ok") { + workerReady = true; + bootResolve?.(); + bootResolve = null; + bootReject = null; + return; + } + + if (msg.type === "boot_error") { + workerBootError = String(msg.error ?? "boot failed"); + workerReady = false; + bootReject?.(new Error(workerBootError)); + bootResolve = null; + bootReject = null; + for (const [id, pending] of execPending) { + pending.reject(new Error(workerBootError)); + execPending.delete(id); + } + writeMsg({ id: "worker", type: "error", message: workerBootError }); + return; + } + + if (msg.type === "exec_result") { + const pending = execPending.get(msg.id); + if (pending) { + execPending.delete(msg.id); + pending.resolve(msg); + } + return; + } + + if (msg.type === "deps_install_result") { + const pending = execPending.get(msg.id); + if (pending) { + execPending.delete(msg.id); + pending.resolve(msg); + } + return; + } + + if (msg.type === "rpc_request") { + // args_json is required to avoid DataCloneError (Pyodide dict proxies are not cloneable). + writeMsg({ + id: msg.id, + type: "rpc_request", + namespace: msg.namespace, + op: msg.op, + args_json: String(msg.args_json ?? "{}"), + }); + return; + } + + // Streamed RPC response from host -> runner -> worker. + // Note: worker only sends rpc_request messages. + }; + + worker.onerror = (e) => { + const m = String((e as any).message ?? e); + workerBootError = m; + workerReady = false; + bootReject?.(new Error(m)); + bootResolve = null; + bootReject = null; + for (const [id, pending] of execPending) { + pending.reject(new Error(m)); + execPending.delete(id); + } + writeMsg({ id: "worker", type: "error", message: m }); + }; +} + +// Ensure exec/deps_install are single-flight, but don't block stdin processing: +// the worker needs rpc_response messages to arrive while code is running. +let runChain: Promise = Promise.resolve(); +function enqueueRun(fn: () => Promise) { + const p = runChain.then(fn, fn); + runChain = p.catch(() => {}); +} + +async function handleReq(req: Req) { + try { + if (req.type === "rpc_response") { + // Forward as chunks to avoid fixed-size transport limits. + ensureWorker(); + const payload = JSON.stringify( + req.ok ? 
{ ok: true, result: req.result } : { + ok: false, + error: req.error, + }, + ); + + const chunkSize = 64 * 1024; + let seq = 0; + for (let off = 0; off < payload.length; off += chunkSize) { + const chunk = payload.slice(off, off + chunkSize); + worker!.postMessage({ + type: "rpc_response_chunk", + id: req.id, + seq, + chunk, + }); + seq += 1; + } + worker!.postMessage({ type: "rpc_response_end", id: req.id, seq }); + return; + } + + if (req.type === "init") { + resetWorker(); + attachWorkerHandler(); + if (bootWait) await bootWait; + writeMsg({ id: req.id, type: "ready" }); + return; + } + + if (req.type === "reset") { + resetWorker(); + attachWorkerHandler(); + if (bootWait) await bootWait; + writeMsg({ id: req.id, type: "ready" }); + return; + } + + if (req.type === "exec") { + enqueueRun(async () => { + if (bootWait) await bootWait; + const res = await callExec(req.id, req.code); + writeMsg({ + id: req.id, + type: "exec_result", + stdout: res.stdout ?? "", + value: res.value ?? null, + error: res.error ?? null, + }); + }); + return; + } + + if (req.type === "deps_install") { + enqueueRun(async () => { + if (bootWait) await bootWait; + const res = await callDepsInstall(req.id, req.packages ?? []); + writeMsg({ + id: req.id, + type: "deps_install_result", + installed: res.installed ?? [], + already_present: res.already_present ?? [], + failed: res.failed ?? [], + }); + }); + return; + } + } catch (e) { + writeMsg({ + id: req.id, + type: "error", + message: String((e as any)?.stack ?? e), + }); + } +} + +for await (const line of readNdjsonLines()) { + if (!line.trim()) continue; + let req: Req; + try { + req = JSON.parse(line); + } catch (e) { + writeMsg({ + id: "parse", + type: "error", + message: `invalid json: ${String(e)}`, + }); + continue; + } + + if (req.type === "close") { + try { + if (worker) worker.terminate(); + worker = null; + writeMsg({ id: req.id, type: "ready" }); + } finally { + break; + } + } + + void handleReq(req); +} diff --git a/src/py_code_mode/execution/deno_sandbox/runner/worker.ts b/src/py_code_mode/execution/deno_sandbox/runner/worker.ts new file mode 100644 index 0000000..d0257f0 --- /dev/null +++ b/src/py_code_mode/execution/deno_sandbox/runner/worker.ts @@ -0,0 +1,431 @@ +// Pyodide worker. Executes Python code and provides async RPC calls +// back to the Deno main thread (which forwards to the Python host). +// +// RPC is promise-based and supports arbitrarily large payloads by streaming +// chunks over postMessage (runner -> worker). + +import { loadPyodide } from "npm:pyodide@0.29.3"; + +// Keep stdout/stderr reserved for the NDJSON protocol in main.ts. +// Pyodide and micropip can be chatty, and interleaved output would corrupt NDJSON. 
+const _noop = () => {}; +console.log = _noop; +console.info = _noop; +console.warn = _noop; +console.debug = _noop; +console.error = _noop; + +type BootMsg = { type: "boot" }; +type ExecMsg = { type: "exec"; id: string; code: string }; +type DepsInstallMsg = { type: "deps_install"; id: string; packages: string[] }; + +type RpcResponseChunkMsg = { + type: "rpc_response_chunk"; + id: string; + seq: number; + chunk: string; +}; +type RpcResponseEndMsg = { type: "rpc_response_end"; id: string; seq: number }; + +type RpcReq = { + type: "rpc_request"; + id: string; + namespace: string; + op: string; + args_json: string; +}; + +type Msg = + | BootMsg + | ExecMsg + | DepsInstallMsg + | RpcResponseChunkMsg + | RpcResponseEndMsg; + +const rpcPending = new Map< + string, + { chunks: string[]; resolve: (v: string) => void; reject: (e: Error) => void } +>(); + +function rpcCallAsync( + namespace: string, + op: string, + argsJson: string, +): Promise { + const id = crypto.randomUUID(); + const msg: RpcReq = { + type: "rpc_request", + id, + namespace, + op, + args_json: String(argsJson ?? "{}"), + }; + + return new Promise((resolve, reject) => { + rpcPending.set(id, { chunks: [], resolve, reject }); + (self as any).postMessage(msg); + }); +} + +function pyodidePackageDir(): string { + // Resolve a file inside the npm package, then derive its directory path. + const resolved = import.meta.resolve("npm:pyodide@0.29.3/pyodide.asm.js"); + if (resolved.startsWith("file:")) { + const u = new URL(resolved); + // Deno uses POSIX paths on macOS/Linux. + const path = decodeURIComponent(u.pathname); + return path.slice(0, path.lastIndexOf("/") + 1); + } + // Fallback: treat as path-like. + const s = String(resolved); + return s.slice(0, s.lastIndexOf("/") + 1); +} + +let pyodide: any = null; +let booted = false; +let micropipLoaded = false; +const attemptedInstalls = new Set(); + +async function ensureBooted() { + if (booted) return; + + const indexURL = pyodidePackageDir(); + pyodide = await loadPyodide({ indexURL, stdout: _noop, stderr: _noop }); + + // Expose async RPC to Python. + (self as any).rpc_call_async = rpcCallAsync; + + // Expose deps installers to Python (so deps.add/sync can just await these). 
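+  // From the Python side (bootstrap below), these are reached through the `js` module,
+  // e.g. `import js` followed by `ok = await js.pycm_install_package(spec)`.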
+ (self as any).pycm_install_package = installPackage; + (self as any).pycm_install_packages = installPackages; + + const bootstrap = ` +import ast, json + +class _RPC: + @staticmethod + async def call(namespace: str, op: str, args: dict): + import js + payload = await js.rpc_call_async(namespace, op, json.dumps(args)) + obj = json.loads(str(payload)) + if not obj.get("ok", False): + err = obj.get("error") or {} + raise RuntimeError(f"RPCError: {err.get('message','unknown')}") + return obj.get("result") + +class _ToolCallable: + def __init__(self, name: str, recipe: str | None = None): + self._name = name + self._recipe = recipe + async def __call__(self, **kwargs): + tool = self._name if self._recipe is None else f"{self._name}.{self._recipe}" + return await _RPC.call("tools", "call_tool", {"name": tool, "args": kwargs}) + +class _Tool: + def __init__(self, name: str): + self._name = name + async def __call__(self, **kwargs): + return await _RPC.call("tools", "call_tool", {"name": self._name, "args": kwargs}) + def __getattr__(self, recipe: str): + if recipe.startswith("_"): + raise AttributeError(recipe) + return _ToolCallable(self._name, recipe) + async def list(self): + return await _RPC.call("tools", "list_tool_recipes", {"name": self._name}) + +class _Tools: + def __getattr__(self, name: str): + if name.startswith("_"): + raise AttributeError(name) + return _Tool(name) + async def list(self): + return await _RPC.call("tools", "list_tools", {}) + async def search(self, query: str, limit: int = 5): + return await _RPC.call("tools", "search_tools", {"query": query, "limit": limit}) + +tools = _Tools() + +class workflows: + @staticmethod + async def list(): + return await _RPC.call("workflows", "list_workflows", {}) + @staticmethod + async def search(query: str, limit: int = 5): + return await _RPC.call("workflows", "search_workflows", {"query": query, "limit": limit}) + @staticmethod + async def get(name: str): + return await _RPC.call("workflows", "get_workflow", {"name": name}) + @staticmethod + async def create(name: str, source: str, description: str = ""): + return await _RPC.call("workflows", "create_workflow", {"name": name, "source": source, "description": description}) + @staticmethod + async def delete(name: str): + return await _RPC.call("workflows", "delete_workflow", {"name": name}) + @staticmethod + async def invoke(workflow_name: str, **kwargs): + import asyncio + wf = await workflows.get(workflow_name) + if wf is None or not isinstance(wf, dict): + raise ValueError(f"Workflow not found: {workflow_name}") + source = wf.get("source") + if not source: + raise ValueError(f"Workflow has no source: {workflow_name}") + ns = {"tools": tools, "workflows": workflows, "artifacts": artifacts, "deps": deps} + exec(source, ns, ns) + run_func = ns.get("run") + if not callable(run_func): + raise ValueError(f"Workflow {workflow_name} has no run() function") + result = run_func(**kwargs) + if asyncio.iscoroutine(result): + result = await result + return result + +class artifacts: + @staticmethod + async def list(): + return await _RPC.call("artifacts", "list_artifacts", {}) + @staticmethod + async def get(name: str): + return await _RPC.call("artifacts", "get_artifact", {"name": name}) + @staticmethod + async def exists(name: str): + return await _RPC.call("artifacts", "artifact_exists", {"name": name}) + @staticmethod + async def load(name: str): + return await _RPC.call("artifacts", "load_artifact", {"name": name}) + @staticmethod + async def save(name: str, data, description: str = 
""): + return await _RPC.call("artifacts", "save_artifact", {"name": name, "data": data, "description": description}) + @staticmethod + async def delete(name: str): + return await _RPC.call("artifacts", "delete_artifact", {"name": name}) + +class deps: + @staticmethod + async def list(): + return await _RPC.call("deps", "list_deps", {}) + @staticmethod + async def add(spec: str): + await _RPC.call("deps", "persist_add", {"spec": spec}) + import js + ok = await js.pycm_install_package(spec) + if ok: + return {"installed": [spec], "already_present": [], "failed": []} + return {"installed": [], "already_present": [], "failed": [spec]} + @staticmethod + async def remove(spec_or_name: str): + removed = await _RPC.call("deps", "persist_remove", {"spec_or_name": spec_or_name}) + return { + "removed": [spec_or_name] if removed else [], + "not_found": [] if removed else [spec_or_name], + "failed": [], + "removed_from_config": bool(removed), + } + @staticmethod + async def sync(): + specs = await _RPC.call("deps", "list_deps", {}) or [] + import js + res = await js.pycm_install_packages(list(specs)) + return res +`; + + pyodide.runPython(bootstrap); + booted = true; +} + +async function ensureMicropipLoaded(): Promise { + if (micropipLoaded) return; + if (!pyodide) throw new Error("pyodide not initialized"); + await pyodide.loadPackage("micropip"); + micropipLoaded = true; +} + +async function installPackage(spec: string): Promise { + const s = String(spec ?? "").trim(); + if (!s) return false; + if (attemptedInstalls.has(s)) return true; + + await ensureMicropipLoaded(); + try { + pyodide.globals.set("_PYCM_DEP_SPEC", s); + await pyodide.runPythonAsync(` +import micropip +await micropip.install(_PYCM_DEP_SPEC) +`); + attemptedInstalls.add(s); + return true; + } catch { + return false; + } +} + +async function installPackages( + packages: string[], +): Promise< + { installed: string[]; already_present: string[]; failed: string[] } +> { + const installed: string[] = []; + const already_present: string[] = []; + const failed: string[] = []; + + for (const p of packages ?? []) { + const spec = String(p ?? 
"").trim(); + if (!spec) continue; + if (attemptedInstalls.has(spec)) { + already_present.push(spec); + continue; + } + const ok = await installPackage(spec); + if (ok) installed.push(spec); + else failed.push(spec); + } + + return { installed, already_present, failed }; +} + +async function runWithLastExprAsync( + code: string, +): Promise<{ stdout: string; value: any; error: string | null }> { + const wrapper = ` +import ast, asyncio, io, sys, traceback +_stdout = io.StringIO() +_value = None +_error = None + +async def _pycm_exec(_CODE: str): + global _value, _error + try: + _tree = ast.parse(_CODE) + if _tree.body and isinstance(_tree.body[-1], ast.Expr): + _stmts = _tree.body[:-1] + _expr = _tree.body[-1].value + if _stmts: + _m = ast.Module(body=_stmts, type_ignores=[]) + _c = compile(_m, "", "exec", flags=ast.PyCF_ALLOW_TOP_LEVEL_AWAIT) + _old = sys.stdout + sys.stdout = _stdout + try: + _r = eval(_c, globals(), globals()) + if asyncio.iscoroutine(_r): + await _r + finally: + sys.stdout = _old + _ec = compile(ast.Expression(body=_expr), "", "eval", flags=ast.PyCF_ALLOW_TOP_LEVEL_AWAIT) + _old = sys.stdout + sys.stdout = _stdout + try: + _r2 = eval(_ec, globals(), globals()) + if asyncio.iscoroutine(_r2): + _r2 = await _r2 + _value = _r2 + finally: + sys.stdout = _old + else: + _c = compile(_tree, "", "exec", flags=ast.PyCF_ALLOW_TOP_LEVEL_AWAIT) + _old = sys.stdout + sys.stdout = _stdout + try: + _r = eval(_c, globals(), globals()) + if asyncio.iscoroutine(_r): + await _r + finally: + sys.stdout = _old + _value = None + except Exception: + _error = traceback.format_exc() + +await _pycm_exec(_CODE) +`; + + if (!pyodide) throw new Error("pyodide not initialized"); + pyodide.globals.set("_CODE", code); + await pyodide.runPythonAsync(wrapper); + + const stdout = pyodide.globals.get("_stdout").getvalue(); + const error = pyodide.globals.get("_error"); + + let outValue: any; + try { + const jsonTxt = pyodide.runPython( + "import json; json.dumps(_value)", + ) as string; + outValue = JSON.parse(String(jsonTxt)); + } catch { + const repr = pyodide.runPython("repr(_value)") as string; + outValue = { __py_repr__: String(repr) }; + } + + return { + stdout: String(stdout ?? ""), + value: outValue ?? null, + error: error ? String(error) : null, + }; +} + +self.onmessage = async (ev: MessageEvent) => { + const msg = ev.data as any; + + if (msg.type === "rpc_response_chunk") { + const p = rpcPending.get(msg.id); + if (!p) return; + p.chunks.push(String(msg.chunk ?? "")); + return; + } + + if (msg.type === "rpc_response_end") { + const p = rpcPending.get(msg.id); + if (!p) return; + rpcPending.delete(msg.id); + p.resolve(p.chunks.join("")); + return; + } + + if (msg.type === "boot") { + try { + await ensureBooted(); + (self as any).postMessage({ type: "boot_ok" }); + } catch (e) { + (self as any).postMessage({ + type: "boot_error", + error: String((e as any)?.stack ?? e), + }); + } + return; + } + + if (msg.type === "exec") { + try { + const res = await runWithLastExprAsync(msg.code); + (self as any).postMessage({ type: "exec_result", id: msg.id, ...res }); + } catch (e) { + (self as any).postMessage({ + type: "exec_result", + id: msg.id, + stdout: "", + value: null, + error: String((e as any)?.stack ?? e), + }); + } + return; + } + + if (msg.type === "deps_install") { + try { + const res = await installPackages(msg.packages ?? 
[]); + (self as any).postMessage({ + type: "deps_install_result", + id: msg.id, + ...res, + }); + } catch (e) { + (self as any).postMessage({ + type: "deps_install_result", + id: msg.id, + installed: [], + already_present: [], + failed: (msg.packages ?? []).map((p: any) => String(p)), + error: String((e as any)?.stack ?? e), + }); + } + } +}; diff --git a/src/py_code_mode/execution/in_process/executor.py b/src/py_code_mode/execution/in_process/executor.py index ba43519..999501e 100644 --- a/src/py_code_mode/execution/in_process/executor.py +++ b/src/py_code_mode/execution/in_process/executor.py @@ -17,6 +17,7 @@ from contextlib import redirect_stdout from typing import TYPE_CHECKING, Any +from py_code_mode.artifacts import ArtifactsNamespace from py_code_mode.deps import ( ControlledDepsNamespace, DepsNamespace, @@ -102,7 +103,7 @@ def __init__( # Inject artifacts namespace if artifact_store provided if artifact_store is not None: - self._namespace["artifacts"] = artifact_store + self._namespace["artifacts"] = ArtifactsNamespace(artifact_store) # Inject deps namespace if provided (wrap if runtime deps disabled) if deps_namespace is not None: @@ -151,17 +152,22 @@ async def run(self, code: str, timeout: float | None = None) -> ExecutionResult: timeout = timeout if timeout is not None else self._default_timeout - # Store loop reference for tool/workflow calls from thread context - loop = asyncio.get_running_loop() - if "tools" in self._namespace: - self._namespace["tools"].set_loop(loop) - if "workflows" in self._namespace: - self._namespace["workflows"].set_loop(loop) + sync_mode = not self._requires_top_level_await(code) + + # Store loop reference for tool calls from thread context. + # Only used for the sync execution path; the async path executes in its + # own event loop in the worker thread. 
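+        # e.g. `tools.curl.get(url="...")` compiles without top-level await and stays on
+        # the sync path, while `result = await some_coro()` (hypothetical) requires
+        # PyCF_ALLOW_TOP_LEVEL_AWAIT and is routed to _run_async_in_thread instead.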
+ if sync_mode: + loop = asyncio.get_running_loop() + if "tools" in self._namespace: + self._namespace["tools"].set_loop(loop) # Run in thread to allow timeout cancellation try: return await asyncio.wait_for( - asyncio.to_thread(self._run_sync, code), + asyncio.to_thread(self._run_sync, code) + if sync_mode + else asyncio.to_thread(self._run_async_in_thread, code), timeout=timeout, ) except TimeoutError: @@ -171,6 +177,19 @@ async def run(self, code: str, timeout: float | None = None) -> ExecutionResult: error=f"Execution timeout after {timeout} seconds", ) + @staticmethod + def _requires_top_level_await(code: str) -> bool: + """Return True if code needs PyCF_ALLOW_TOP_LEVEL_AWAIT to compile.""" + try: + compile(code, "", "exec") + return False + except (SyntaxError, RecursionError): + try: + compile(code, "", "exec", flags=ast.PyCF_ALLOW_TOP_LEVEL_AWAIT) + return True + except (SyntaxError, RecursionError): + return False + def _run_sync(self, code: str) -> ExecutionResult: """Run code synchronously, capturing output.""" stdout_capture = io.StringIO() @@ -218,6 +237,52 @@ def _run_sync(self, code: str) -> ExecutionResult: error=traceback.format_exc(), ) + def _run_async_in_thread(self, code: str) -> ExecutionResult: + """Execute code in a fresh event loop (supports top-level await).""" + try: + return asyncio.run(self._run_async(code)) + except Exception: + return ExecutionResult(value=None, stdout="", error=traceback.format_exc()) + + async def _run_async(self, code: str) -> ExecutionResult: + """Run code allowing top-level await, preserving last-expression semantics.""" + stdout_capture = io.StringIO() + try: + tree = ast.parse(code) + flags = ast.PyCF_ALLOW_TOP_LEVEL_AWAIT + + with redirect_stdout(stdout_capture): + if tree.body and isinstance(tree.body[-1], ast.Expr): + stmts = tree.body[:-1] + expr = tree.body[-1] + + if stmts: + stmt_tree = ast.Module(body=stmts, type_ignores=[]) + stmt_code = compile(stmt_tree, "", "exec", flags=flags) + maybe = _eval_code(stmt_code, self._namespace, self._namespace) + if asyncio.iscoroutine(maybe): + await maybe + + expr_tree = ast.Expression(body=expr.value) + expr_code = compile(expr_tree, "", "eval", flags=flags) + value = _eval_code(expr_code, self._namespace, self._namespace) + if asyncio.iscoroutine(value): + value = await value + else: + stmt_code = compile(tree, "", "exec", flags=flags) + maybe = _eval_code(stmt_code, self._namespace, self._namespace) + if asyncio.iscoroutine(maybe): + await maybe + value = None + + return ExecutionResult(value=value, stdout=stdout_capture.getvalue(), error=None) + except Exception: + return ExecutionResult( + value=None, + stdout=stdout_capture.getvalue(), + error=traceback.format_exc(), + ) + async def close(self) -> None: """Release executor resources.""" self._closed = True @@ -315,7 +380,7 @@ async def start( ) self._artifact_store = storage.get_artifact_store() - self._namespace["artifacts"] = self._artifact_store + self._namespace["artifacts"] = ArtifactsNamespace(self._artifact_store) elif self._workflow_library is not None: # Use workflow_library from __init__ if provided self._namespace["workflows"] = WorkflowsNamespace( @@ -324,7 +389,7 @@ async def start( if storage is None and self._artifact_store is not None: # Use artifact_store from __init__ if provided - self._namespace["artifacts"] = self._artifact_store + self._namespace["artifacts"] = ArtifactsNamespace(self._artifact_store) async def install_deps(self, packages: list[str]) -> dict[str, Any]: """Install packages in the in-process 
environment. diff --git a/src/py_code_mode/execution/in_process/workflows_namespace.py b/src/py_code_mode/execution/in_process/workflows_namespace.py index 4bbf680..bef9125 100644 --- a/src/py_code_mode/execution/in_process/workflows_namespace.py +++ b/src/py_code_mode/execution/in_process/workflows_namespace.py @@ -6,7 +6,6 @@ from __future__ import annotations -import asyncio import builtins import inspect from typing import TYPE_CHECKING, Any @@ -46,15 +45,8 @@ def __init__(self, library: WorkflowLibrary, namespace: dict[str, Any]) -> None: self._library = library self._namespace = namespace - self._loop: asyncio.AbstractEventLoop | None = None - - def set_loop(self, loop: asyncio.AbstractEventLoop) -> None: - """Set the event loop to use for async workflow invocations. - - When code runs in a thread (via asyncio.to_thread), we need a reference - to the main event loop to execute async workflows via run_coroutine_threadsafe. - """ - self._loop = loop + # Intentionally synchronous surface. Async workflows are supported via + # asyncio.run(...) when invoked from sync code (the default execution mode). @property def library(self) -> WorkflowLibrary: @@ -65,7 +57,7 @@ def library(self) -> WorkflowLibrary: return self._library def search(self, query: str, limit: int = 10) -> builtins.list[dict[str, Any]]: - """Search for workflows matching query. Returns simplified workflow info.""" + """Search for workflows matching query.""" workflows = self._library.search(query, limit) return [self._simplify(w) for w in workflows] @@ -74,7 +66,7 @@ def get(self, name: str) -> Any: return self._library.get(name) def list(self) -> builtins.list[dict[str, Any]]: - """List all available workflows. Returns simplified workflow info.""" + """List all available workflows.""" workflows = self._library.list() return [self._simplify(w) for w in workflows] @@ -168,10 +160,11 @@ def invoke(self, workflow_name: str, **kwargs: Any) -> Any: result = run_func(**kwargs) if inspect.iscoroutine(result): - try: - asyncio.get_running_loop() - except RuntimeError: - return asyncio.run(result) - raise RuntimeError("Cannot invoke async workflows from a running event loop") + # Default agent code execution runs in a worker thread without a + # running event loop, so asyncio.run(...) is safe and yields a + # synchronous result. + import asyncio + + return asyncio.run(result) return result diff --git a/src/py_code_mode/execution/resource_provider.py b/src/py_code_mode/execution/resource_provider.py new file mode 100644 index 0000000..baa7867 --- /dev/null +++ b/src/py_code_mode/execution/resource_provider.py @@ -0,0 +1,284 @@ +"""Host-side ResourceProvider for sandboxed executors. + +This module contains the provider used by isolated runtimes to access +tools/workflows/artifacts/deps via RPC. + +Today SubprocessExecutor uses this to service kernel-side proxy namespaces. +The Deno/Pyodide executor will reuse the same provider to avoid duplicating +behavior across backends. +""" + +from __future__ import annotations + +import logging +from typing import TYPE_CHECKING, Any + +from py_code_mode.deps import DepsStore +from py_code_mode.tools import ToolRegistry + +if TYPE_CHECKING: + from py_code_mode.execution.subprocess.venv import KernelVenv, VenvManager + from py_code_mode.storage.backends import StorageBackend + +logger = logging.getLogger(__name__) + + +class StorageResourceProvider: + """ResourceProvider that bridges RPC to storage backend. 
+ + Delegates to: + - tool_registry (executor-owned, from config.tools_path) + - storage backend (workflows + artifacts) + - deps_store (executor-owned, from config.deps/deps_file) + + Notes: + - For SubprocessExecutor, deps installation uses VenvManager. + - For other executors (e.g., Deno/Pyodide), deps ops may be mediated + differently; those executors can ignore the venv fields or provide their own. + """ + + def __init__( + self, + storage: StorageBackend, + tool_registry: ToolRegistry | None = None, + deps_store: DepsStore | None = None, + allow_runtime_deps: bool = True, + venv_manager: VenvManager | None = None, + venv: KernelVenv | None = None, + ) -> None: + self._storage = storage + self._tool_registry = tool_registry + self._deps_store = deps_store + self._allow_runtime_deps = allow_runtime_deps + self._venv_manager = venv_manager + self._venv = venv + self._workflow_library = None # lazy + + def _get_tool_registry(self) -> ToolRegistry | None: + return self._tool_registry + + def _get_workflow_library(self): + if self._workflow_library is None: + self._workflow_library = self._storage.get_workflow_library() + return self._workflow_library + + # ------------------------------------------------------------------------- + # Tool methods + # ------------------------------------------------------------------------- + + async def call_tool(self, name: str, args: dict[str, Any]) -> Any: + registry = self._get_tool_registry() + if registry is None: + raise ValueError("No tools configured") + + if "." in name: + tool_name, recipe_name = name.split(".", 1) + else: + tool_name = name + recipe_name = None + + return await registry.call_tool(tool_name, recipe_name, args) + + async def list_tools(self) -> list[dict[str, Any]]: + registry = self._get_tool_registry() + if registry is None: + return [] + return [tool.to_dict() for tool in registry.list_tools()] + + async def search_tools(self, query: str, limit: int) -> list[dict[str, Any]]: + registry = self._get_tool_registry() + if registry is None: + return [] + return [tool.to_dict() for tool in registry.search(query, limit=limit)] + + async def list_tool_recipes(self, name: str) -> list[dict[str, Any]]: + registry = self._get_tool_registry() + if registry is None: + raise ValueError("No tools configured") + + all_tools = registry.get_all_tools() + tool = next((t for t in all_tools if t.name == name), None) + if tool is None: + raise ValueError(f"Unknown tool: {name}") + + return [{"name": c.name, "description": c.description or ""} for c in tool.callables] + + # ------------------------------------------------------------------------- + # Workflow methods + # ------------------------------------------------------------------------- + + async def search_workflows(self, query: str, limit: int) -> list[dict[str, Any]]: + library = self._get_workflow_library() + library.refresh() + workflows = library.search(query, limit=limit) + return [ + { + "name": w.name, + "description": w.description, + "params": {p.name: p.description or p.type for p in w.parameters}, + } + for w in workflows + ] + + async def list_workflows(self) -> list[dict[str, Any]]: + library = self._get_workflow_library() + library.refresh() + workflows = library.list() + return [ + { + "name": w.name, + "description": w.description, + "params": {p.name: p.description or p.type for p in w.parameters}, + } + for w in workflows + ] + + async def get_workflow(self, name: str) -> dict[str, Any] | None: + library = self._get_workflow_library() + library.refresh() + workflow = 
library.get(name) + if workflow is None: + return None + return { + "name": workflow.name, + "description": workflow.description, + "source": workflow.source, + "params": {p.name: p.description or p.type for p in workflow.parameters}, + } + + async def create_workflow(self, name: str, source: str, description: str) -> dict[str, Any]: + from py_code_mode.workflows import PythonWorkflow + + workflow = PythonWorkflow.from_source( + name=name, + source=source, + description=description, + ) + + library = self._get_workflow_library() + library.add(workflow) + + return { + "name": workflow.name, + "description": workflow.description, + "params": {p.name: p.description or p.type for p in workflow.parameters}, + } + + async def delete_workflow(self, name: str) -> bool: + library = self._get_workflow_library() + return library.remove(name) + + # ------------------------------------------------------------------------- + # Artifact methods + # ------------------------------------------------------------------------- + + async def load_artifact(self, name: str) -> Any: + store = self._storage.get_artifact_store() + return store.load(name) + + async def save_artifact(self, name: str, data: Any, description: str) -> dict[str, Any]: + store = self._storage.get_artifact_store() + artifact = store.save(name, data, description=description) + return { + "name": artifact.name, + "path": artifact.path, + "description": artifact.description, + "created_at": artifact.created_at.isoformat(), + } + + async def list_artifacts(self) -> list[dict[str, Any]]: + store = self._storage.get_artifact_store() + artifacts = store.list() + return [ + { + "name": a.name, + "path": a.path, + "description": a.description, + "created_at": a.created_at.isoformat(), + } + for a in artifacts + ] + + async def delete_artifact(self, name: str) -> None: + store = self._storage.get_artifact_store() + store.delete(name) + + async def artifact_exists(self, name: str) -> bool: + store = self._storage.get_artifact_store() + return store.exists(name) + + async def get_artifact(self, name: str) -> dict[str, Any] | None: + store = self._storage.get_artifact_store() + artifact = store.get(name) + if artifact is None: + return None + return { + "name": artifact.name, + "path": artifact.path, + "description": artifact.description, + "created_at": artifact.created_at.isoformat(), + } + + # ------------------------------------------------------------------------- + # Deps methods (host-side persistence + optional venv install hook) + # ------------------------------------------------------------------------- + + async def add_dep(self, package: str) -> dict[str, Any]: + if not self._allow_runtime_deps: + raise RuntimeError( + "RuntimeDepsDisabledError: Runtime dependency installation is disabled. " + "Dependencies must be pre-configured before session start." + ) + + if self._deps_store is not None: + self._deps_store.add(package) + + # SubprocessExecutor path: also install into venv if available. 
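+        # e.g. add_dep("httpx") -> {"installed": ["httpx"], "already_present": [], "failed": []}
+        # when the venv install succeeds; a failed install moves the package to "failed".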
+ if self._venv_manager is not None and self._venv is not None: + try: + await self._venv_manager.add_package(self._venv, package) + return {"installed": [package], "already_present": [], "failed": []} + except Exception as e: + logger.warning("Failed to install %s: %s", package, e) + return {"installed": [], "already_present": [], "failed": [package]} + + return {"installed": [package], "already_present": [], "failed": []} + + async def remove_dep(self, package: str) -> bool: + if not self._allow_runtime_deps: + raise RuntimeError( + "RuntimeDepsDisabledError: Runtime dependency modification is disabled. " + "Dependencies must be pre-configured before session start." + ) + + if self._deps_store is None: + return False + return self._deps_store.remove(package) + + async def list_deps(self) -> list[str]: + if self._deps_store is None: + return [] + return self._deps_store.list() + + async def sync_deps(self) -> dict[str, Any]: + if self._deps_store is None: + return {"installed": [], "already_present": [], "failed": []} + + packages = self._deps_store.list() + if not packages: + return {"installed": [], "already_present": [], "failed": []} + + if self._venv_manager is None or self._venv is None: + return {"installed": packages, "already_present": [], "failed": []} + + installed: list[str] = [] + failed: list[str] = [] + for pkg in packages: + try: + await self._venv_manager.add_package(self._venv, pkg) + installed.append(pkg) + except Exception as e: + logger.warning("Failed to install %s: %s", pkg, e) + failed.append(pkg) + + return {"installed": installed, "already_present": [], "failed": failed} diff --git a/src/py_code_mode/execution/subprocess/executor.py b/src/py_code_mode/execution/subprocess/executor.py index f3c234d..aaad9d2 100644 --- a/src/py_code_mode/execution/subprocess/executor.py +++ b/src/py_code_mode/execution/subprocess/executor.py @@ -31,6 +31,7 @@ validate_storage_not_access, ) from py_code_mode.execution.registry import register_backend +from py_code_mode.execution.resource_provider import StorageResourceProvider from py_code_mode.execution.subprocess.config import SubprocessConfig from py_code_mode.execution.subprocess.host import KernelHost from py_code_mode.execution.subprocess.venv import KernelVenv, VenvManager @@ -64,324 +65,6 @@ def _deserialize_value(text_repr: str | None) -> Any: return text_repr -class StorageResourceProvider: - """ResourceProvider that bridges RPC to storage backend. - - This class implements the ResourceProvider protocol by delegating - to the storage backend for workflows and artifacts, and using - executor-provided tool registry and deps store. - """ - - def __init__( - self, - storage: StorageBackend, - tool_registry: ToolRegistry | None = None, - deps_store: DepsStore | None = None, - allow_runtime_deps: bool = True, - venv_manager: VenvManager | None = None, - venv: KernelVenv | None = None, - ) -> None: - """Initialize provider. - - Args: - storage: Storage backend for workflows and artifacts. - tool_registry: Tool registry loaded from executor config. - deps_store: Deps store for dependency management. - allow_runtime_deps: Whether to allow deps.add() and deps.remove(). - venv_manager: VenvManager for package installation. - venv: KernelVenv for the current subprocess. 
- """ - self._storage = storage - self._tool_registry = tool_registry - self._deps_store = deps_store - self._allow_runtime_deps = allow_runtime_deps - self._venv_manager = venv_manager - self._venv = venv - # Cached workflow library (lazy initialized) - self._workflow_library = None - - def _get_tool_registry(self) -> ToolRegistry | None: - """Get tool registry. Already loaded at construction time.""" - return self._tool_registry - - def _get_workflow_library(self): - """Get workflow library, caching the result.""" - if self._workflow_library is None: - self._workflow_library = self._storage.get_workflow_library() - return self._workflow_library - - # ------------------------------------------------------------------------- - # Tool methods - # ------------------------------------------------------------------------- - - async def call_tool(self, name: str, args: dict[str, Any]) -> Any: - """Call a tool by name with given arguments. - - Supports both: - - Direct tool invocation: name="curl", args={...} - - Recipe invocation: name="curl.get", args={...} - """ - registry = self._get_tool_registry() - if registry is None: - raise ValueError("No tools configured") - - # Parse name for recipe syntax (e.g., "curl.get") - if "." in name: - tool_name, recipe_name = name.split(".", 1) - else: - tool_name = name - recipe_name = None - - # Find the tool's adapter - adapter = registry.find_adapter_for_tool(tool_name) - if adapter is None: - raise ValueError(f"Unknown tool: {tool_name}") - - # Call the tool - return await adapter.call_tool(tool_name, recipe_name, args) - - async def list_tools(self) -> list[dict[str, Any]]: - """List all available tools.""" - registry = self._get_tool_registry() - if registry is None: - return [] - return [tool.to_dict() for tool in registry.list_tools()] - - async def search_tools(self, query: str, limit: int) -> list[dict[str, Any]]: - """Search tools by query.""" - registry = self._get_tool_registry() - if registry is None: - return [] - return [tool.to_dict() for tool in registry.search(query, limit=limit)] - - async def list_tool_recipes(self, name: str) -> list[dict[str, Any]]: - """List recipes for a specific tool.""" - registry = self._get_tool_registry() - if registry is None: - raise ValueError("No tools configured") - all_tools = registry.get_all_tools() - tool = next((t for t in all_tools if t.name == name), None) - if tool is None: - raise ValueError(f"Unknown tool: {name}") - - return [ - { - "name": c.name, - "description": c.description or "", - } - for c in tool.callables - ] - - # ------------------------------------------------------------------------- - # Workflow methods - # ------------------------------------------------------------------------- - - async def search_workflows(self, query: str, limit: int) -> list[dict[str, Any]]: - """Search for workflows matching query.""" - library = self._get_workflow_library() - library.refresh() - workflows = library.search(query, limit=limit) - return [ - { - "name": w.name, - "description": w.description, - "params": {p.name: p.description or p.type for p in w.parameters}, - } - for w in workflows - ] - - async def list_workflows(self) -> list[dict[str, Any]]: - """List all available workflows.""" - library = self._get_workflow_library() - library.refresh() - workflows = library.list() - return [ - { - "name": w.name, - "description": w.description, - "params": {p.name: p.description or p.type for p in w.parameters}, - } - for w in workflows - ] - - async def get_workflow(self, name: str) -> dict[str, 
Any] | None: - """Get a workflow by name.""" - library = self._get_workflow_library() - library.refresh() - workflow = library.get(name) - if workflow is None: - return None - return { - "name": workflow.name, - "description": workflow.description, - "source": workflow.source, - "params": {p.name: p.description or p.type for p in workflow.parameters}, - } - - async def create_workflow(self, name: str, source: str, description: str) -> dict[str, Any]: - """Create and save a new workflow.""" - from py_code_mode.workflows import PythonWorkflow - - workflow = PythonWorkflow.from_source( - name=name, - source=source, - description=description, - ) - - library = self._get_workflow_library() - library.add(workflow) - - return { - "name": workflow.name, - "description": workflow.description, - "params": {p.name: p.description or p.type for p in workflow.parameters}, - } - - async def delete_workflow(self, name: str) -> bool: - """Delete a workflow.""" - library = self._get_workflow_library() - return library.remove(name) - - # ------------------------------------------------------------------------- - # Artifact methods - # ------------------------------------------------------------------------- - - async def load_artifact(self, name: str) -> Any: - """Load an artifact by name.""" - store = self._storage.get_artifact_store() - return store.load(name) - - async def save_artifact(self, name: str, data: Any, description: str) -> dict[str, Any]: - """Save an artifact.""" - store = self._storage.get_artifact_store() - artifact = store.save(name, data, description=description) - return { - "name": artifact.name, - "path": artifact.path, - "description": artifact.description, - "created_at": artifact.created_at.isoformat(), - } - - async def list_artifacts(self) -> list[dict[str, Any]]: - """List all artifacts.""" - store = self._storage.get_artifact_store() - artifacts = store.list() - return [ - { - "name": a.name, - "path": a.path, - "description": a.description, - "created_at": a.created_at.isoformat(), - } - for a in artifacts - ] - - async def delete_artifact(self, name: str) -> None: - """Delete an artifact.""" - store = self._storage.get_artifact_store() - store.delete(name) - - async def artifact_exists(self, name: str) -> bool: - """Check if an artifact exists.""" - store = self._storage.get_artifact_store() - return store.exists(name) - - async def get_artifact(self, name: str) -> dict[str, Any] | None: - """Get artifact metadata.""" - store = self._storage.get_artifact_store() - artifact = store.get(name) - if artifact is None: - return None - return { - "name": artifact.name, - "path": artifact.path, - "description": artifact.description, - "created_at": artifact.created_at.isoformat(), - } - - # ------------------------------------------------------------------------- - # Deps methods - # ------------------------------------------------------------------------- - - async def add_dep(self, package: str) -> dict[str, Any]: - """Add and install a package. - - When allow_runtime_deps=False, raises RuntimeError. - """ - if not self._allow_runtime_deps: - raise RuntimeError( - "RuntimeDepsDisabledError: Runtime dependency installation is disabled. " - "Dependencies must be pre-configured before session start." 
- ) - - # Add to deps store if configured - if self._deps_store is not None: - self._deps_store.add(package) - - # Install via venv manager if available - if self._venv_manager is not None and self._venv is not None: - try: - await self._venv_manager.add_package(self._venv, package) - return {"installed": [package], "already_present": [], "failed": []} - except Exception as e: - logger.warning("Failed to install %s: %s", package, e) - return {"installed": [], "already_present": [], "failed": [package]} - else: - # No venv manager - just report what we would install - return {"installed": [package], "already_present": [], "failed": []} - - async def remove_dep(self, package: str) -> bool: - """Remove a package from configuration. - - When allow_runtime_deps=False, raises RuntimeError. - """ - if not self._allow_runtime_deps: - raise RuntimeError( - "RuntimeDepsDisabledError: Runtime dependency modification is disabled. " - "Dependencies must be pre-configured before session start." - ) - - if self._deps_store is None: - return False - return self._deps_store.remove(package) - - async def list_deps(self) -> list[str]: - """List configured packages.""" - if self._deps_store is None: - return [] - return self._deps_store.list() - - async def sync_deps(self) -> dict[str, Any]: - """Install all configured packages. - - This is always allowed, even when allow_runtime_deps=False, - because it only installs pre-configured packages. - """ - if self._deps_store is None: - return {"installed": [], "already_present": [], "failed": []} - - packages = self._deps_store.list() - - if not packages: - return {"installed": [], "already_present": [], "failed": []} - - if self._venv_manager is None or self._venv is None: - return {"installed": packages, "already_present": [], "failed": []} - - installed: list[str] = [] - failed: list[str] = [] - - for pkg in packages: - try: - await self._venv_manager.add_package(self._venv, pkg) - installed.append(pkg) - except Exception as e: - logger.warning("Failed to install %s: %s", pkg, e) - failed.append(pkg) - - return {"installed": installed, "already_present": [], "failed": failed} - - class SubprocessExecutor: """Execute code in an isolated subprocess with its own venv and IPython kernel. diff --git a/src/py_code_mode/execution/subprocess/kernel_init.py b/src/py_code_mode/execution/subprocess/kernel_init.py index c74b14f..327b3a8 100644 --- a/src/py_code_mode/execution/subprocess/kernel_init.py +++ b/src/py_code_mode/execution/subprocess/kernel_init.py @@ -27,6 +27,7 @@ def get_kernel_init_code(ipc_timeout: float | None = None) -> str: from __future__ import annotations import json +import asyncio import threading import uuid from typing import Any, NamedTuple @@ -51,6 +52,23 @@ def _namespace_error_handler(self, etype, value, tb, tb_offset=None): # Threading lock to prevent concurrent RPC corruption _rpc_lock = threading.Lock() +# Async lock to prevent concurrent RPC corruption when used with await/to_thread +_rpc_async_lock = asyncio.Lock() + + +def _in_async_context() -> bool: + # IPython / ipykernel runs an event loop even for "sync" code execution, + # so using get_running_loop() here would force the entire sandbox surface + # to return coroutine objects and break existing agent code. + # + # SubprocessExecutor's agent-facing namespaces are intentionally synchronous. 
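+    # Agent code therefore calls e.g. tools.curl.get(url="...") without `await` in the
+    # subprocess kernel, and the `if _in_async_context():` branches below never trigger
+    # in practice.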
+ return False + + +async def _rpc_call_async(method: str, **kwargs) -> Any: + async with _rpc_async_lock: + return await asyncio.to_thread(_rpc_call, method, **kwargs) + # Configurable timeout for RPC calls _RPC_TIMEOUT = {ipc_timeout} @@ -307,7 +325,12 @@ def __init__(self, tool_name: str, recipe_name: str): def __call__(self, **kwargs) -> Any: """Invoke the recipe with given arguments.""" - # Recipe invocation: name is "tool.recipe" + if _in_async_context(): + return _rpc_call_async( + "tools.call", + name=f"{{self._tool_name}}.{{self._recipe_name}}", + args=kwargs, + ) return _rpc_call( "tools.call", name=f"{{self._tool_name}}.{{self._recipe_name}}", @@ -324,6 +347,8 @@ def __init__(self, name: str, validated: bool = False): def __call__(self, **kwargs) -> Any: """Direct tool invocation (escape hatch).""" + if _in_async_context(): + return _rpc_call_async("tools.call", name=self._name, args=kwargs) return _rpc_call("tools.call", name=self._name, args=kwargs) def __getattr__(self, recipe_name: str) -> _ToolRecipeProxy: @@ -334,6 +359,8 @@ def __getattr__(self, recipe_name: str) -> _ToolRecipeProxy: def list(self) -> list[dict[str, Any]]: """List recipes for this tool.""" + if _in_async_context(): + return _rpc_call_async("tools.list_recipes", name=self._name) return _rpc_call("tools.list_recipes", name=self._name) @@ -388,7 +415,8 @@ def list(self) -> list[dict[str, Any]]: Returns: List of dicts with name, description, and tags keys. """ - # Return raw dicts (not NamedTuples) so they serialize cleanly through IPython + if _in_async_context(): + return _rpc_call_async("tools.list") return _rpc_call("tools.list") def search(self, query: str, limit: int = 10) -> list[dict[str, Any]]: @@ -397,7 +425,8 @@ def search(self, query: str, limit: int = 10) -> list[dict[str, Any]]: Returns: List of dicts matching the query. """ - # Return raw dicts (not NamedTuples) so they serialize cleanly through IPython + if _in_async_context(): + return _rpc_call_async("tools.search", query=query, limit=limit) return _rpc_call("tools.search", query=query, limit=limit) @@ -418,7 +447,8 @@ def invoke(self, workflow_name: str, **kwargs) -> Any: Gets workflow source from host and executes it locally in the kernel. This ensures workflows can import packages installed at runtime. - Handles async workflows by running them with asyncio.run(). + Handles async workflows by running them to completion in the kernel's + event loop (ipykernel runs a loop even for "sync" execution). Args: workflow_name: Name of the workflow to invoke. @@ -427,7 +457,35 @@ def invoke(self, workflow_name: str, **kwargs) -> Any: Note: Uses workflow_name (not name) to avoid collision with workflows that have a 'name' parameter. 
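+
+        Example (hypothetical workflow):
+            result = workflows.invoke("summarize_logs", path="/tmp/app.log")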
""" - import asyncio + if _in_async_context(): + async def _coro() -> Any: + workflow = await _rpc_call_async("workflows.get", name=workflow_name) + if workflow is None: + raise ValueError(f"Workflow not found: {{workflow_name}}") + + source = workflow.get("source") + if not source: + raise ValueError(f"Workflow has no source: {{workflow_name}}") + + workflow_namespace = {{ + "tools": tools, + "workflows": workflows, + "artifacts": artifacts, + "deps": deps, + }} + code = compile(source, f"", "exec") + exec(code, workflow_namespace) + + run_func = workflow_namespace.get("run") + if not callable(run_func): + raise ValueError(f"Workflow {{workflow_name}} has no run() function") + + result = run_func(**kwargs) + if asyncio.iscoroutine(result): + return await result + return result + + return _coro() workflow = _rpc_call("workflows.get", name=workflow_name) if workflow is None: @@ -452,18 +510,13 @@ def invoke(self, workflow_name: str, **kwargs) -> Any: result = run_func(**kwargs) if asyncio.iscoroutine(result): - try: - asyncio.get_running_loop() - has_loop = True - except RuntimeError: - has_loop = False - - if has_loop: - import concurrent.futures - with concurrent.futures.ThreadPoolExecutor() as pool: - future = pool.submit(asyncio.run, result) - return future.result() - return asyncio.run(result) + # ipykernel runs an event loop already, so asyncio.run() is not valid. + # Use nest_asyncio to allow re-entrant run_until_complete. + import nest_asyncio + + nest_asyncio.apply() + loop = asyncio.get_event_loop() + return loop.run_until_complete(result) return result def search(self, query: str, limit: int = 5) -> list[Workflow]: @@ -472,15 +525,25 @@ def search(self, query: str, limit: int = 5) -> list[Workflow]: Returns: List of Workflow objects matching the query. """ + def _convert(result: list[dict[str, Any]]) -> list[Workflow]: + return [ + Workflow( + name=s["name"], + description=s.get("description", ""), + params=s.get("params", {{}}), + ) + for s in result + ] + + if _in_async_context(): + async def _coro() -> list[Workflow]: + result = await _rpc_call_async("workflows.search", query=query, limit=limit) + return _convert(result) + + return _coro() + result = _rpc_call("workflows.search", query=query, limit=limit) - return [ - Workflow( - name=s["name"], - description=s.get("description", ""), - params=s.get("params", {{}}), - ) - for s in result - ] + return _convert(result) def list(self) -> list[Workflow]: """List all available workflows. @@ -488,21 +551,33 @@ def list(self) -> list[Workflow]: Returns: List of Workflow objects. """ + def _convert(result: list[dict[str, Any]]) -> list[Workflow]: + return [ + Workflow( + name=s["name"], + description=s.get("description", ""), + params=s.get("params", {{}}), + ) + for s in result + ] + + if _in_async_context(): + async def _coro() -> list[Workflow]: + result = await _rpc_call_async("workflows.list") + return _convert(result) + + return _coro() + result = _rpc_call("workflows.list") - return [ - Workflow( - name=s["name"], - description=s.get("description", ""), - params=s.get("params", {{}}), - ) - for s in result - ] + return _convert(result) def get(self, name: str) -> dict[str, Any] | None: """Get a workflow by name. Returns full workflow details including source. 
""" + if _in_async_context(): + return _rpc_call_async("workflows.get", name=name) return _rpc_call("workflows.get", name=name) def create(self, name: str, source: str, description: str = "") -> Workflow: @@ -511,6 +586,19 @@ def create(self, name: str, source: str, description: str = "") -> Workflow: Returns: Workflow object for the created workflow. """ + if _in_async_context(): + async def _coro() -> Workflow: + result = await _rpc_call_async( + "workflows.create", name=name, source=source, description=description + ) + return Workflow( + name=result["name"], + description=result.get("description", ""), + params=result.get("params", {{}}), + ) + + return _coro() + result = _rpc_call("workflows.create", name=name, source=source, description=description) return Workflow( name=result["name"], @@ -520,6 +608,8 @@ def create(self, name: str, source: str, description: str = "") -> Workflow: def delete(self, name: str) -> bool: """Delete a workflow.""" + if _in_async_context(): + return _rpc_call_async("workflows.delete", name=name) return _rpc_call("workflows.delete", name=name) def __getattr__(self, name: str) -> Any: @@ -543,6 +633,8 @@ class ArtifactsProxy: def load(self, name: str) -> Any: """Load an artifact by name.""" + if _in_async_context(): + return _rpc_call_async("artifacts.load", name=name) return _rpc_call("artifacts.load", name=name) def save(self, name: str, data: Any, description: str = "") -> ArtifactMeta: @@ -551,13 +643,25 @@ def save(self, name: str, data: Any, description: str = "") -> ArtifactMeta: Returns: ArtifactMeta with name, path, description, created_at. """ + def _convert(result: dict[str, Any]) -> ArtifactMeta: + return ArtifactMeta( + name=result["name"], + path=result.get("path", ""), + description=result.get("description", ""), + created_at=result.get("created_at", ""), + ) + + if _in_async_context(): + async def _coro() -> ArtifactMeta: + result = await _rpc_call_async( + "artifacts.save", name=name, data=data, description=description + ) + return _convert(result) + + return _coro() + result = _rpc_call("artifacts.save", name=name, data=data, description=description) - return ArtifactMeta( - name=result["name"], - path=result.get("path", ""), - description=result.get("description", ""), - created_at=result.get("created_at", ""), - ) + return _convert(result) def list(self) -> list[ArtifactMeta]: """List all artifacts. @@ -565,36 +669,60 @@ def list(self) -> list[ArtifactMeta]: Returns: List of ArtifactMeta objects. 
""" + def _convert(result: list[dict[str, Any]]) -> list[ArtifactMeta]: + return [ + ArtifactMeta( + name=a["name"], + path=a.get("path", ""), + description=a.get("description", ""), + created_at=a.get("created_at", ""), + ) + for a in result + ] + + if _in_async_context(): + async def _coro() -> list[ArtifactMeta]: + result = await _rpc_call_async("artifacts.list") + return _convert(result) + + return _coro() + result = _rpc_call("artifacts.list") - return [ - ArtifactMeta( - name=a["name"], - path=a.get("path", ""), - description=a.get("description", ""), - created_at=a.get("created_at", ""), - ) - for a in result - ] + return _convert(result) def delete(self, name: str) -> None: """Delete an artifact.""" + if _in_async_context(): + return _rpc_call_async("artifacts.delete", name=name) return _rpc_call("artifacts.delete", name=name) def exists(self, name: str) -> bool: """Check if an artifact exists.""" + if _in_async_context(): + return _rpc_call_async("artifacts.exists", name=name) return _rpc_call("artifacts.exists", name=name) def get(self, name: str) -> ArtifactMeta | None: """Get artifact metadata.""" + def _convert(result: dict[str, Any] | None) -> ArtifactMeta | None: + if result is None: + return None + return ArtifactMeta( + name=result["name"], + path=result.get("path", ""), + description=result.get("description", ""), + created_at=result.get("created_at", ""), + ) + + if _in_async_context(): + async def _coro() -> ArtifactMeta | None: + result = await _rpc_call_async("artifacts.get", name=name) + return _convert(result) + + return _coro() + result = _rpc_call("artifacts.get", name=name) - if result is None: - return None - return ArtifactMeta( - name=result["name"], - path=result.get("path", ""), - description=result.get("description", ""), - created_at=result.get("created_at", ""), - ) + return _convert(result) class DepsProxy: @@ -616,19 +744,33 @@ def add(self, package: str) -> SyncResult: Returns: SyncResult with installed, already_present, and failed tuples. """ + def _convert(result: dict[str, Any]) -> SyncResult: + return SyncResult( + installed=tuple(result.get("installed", [])), + already_present=tuple(result.get("already_present", [])), + failed=tuple(result.get("failed", [])), + ) + + if _in_async_context(): + async def _coro() -> SyncResult: + result = await _rpc_call_async("deps.add", package=package) + return _convert(result) + + return _coro() + result = _rpc_call("deps.add", package=package) - return SyncResult( - installed=tuple(result.get("installed", [])), - already_present=tuple(result.get("already_present", [])), - failed=tuple(result.get("failed", [])), - ) + return _convert(result) def remove(self, package: str) -> bool: """Remove a package from configuration.""" + if _in_async_context(): + return _rpc_call_async("deps.remove", package=package) return _rpc_call("deps.remove", package=package) def list(self) -> list[str]: """List configured packages.""" + if _in_async_context(): + return _rpc_call_async("deps.list") return _rpc_call("deps.list") def sync(self) -> SyncResult: @@ -637,12 +779,22 @@ def sync(self) -> SyncResult: Returns: SyncResult with installed, already_present, and failed tuples. 
""" + def _convert(result: dict[str, Any]) -> SyncResult: + return SyncResult( + installed=tuple(result.get("installed", [])), + already_present=tuple(result.get("already_present", [])), + failed=tuple(result.get("failed", [])), + ) + + if _in_async_context(): + async def _coro() -> SyncResult: + result = await _rpc_call_async("deps.sync") + return _convert(result) + + return _coro() + result = _rpc_call("deps.sync") - return SyncResult( - installed=tuple(result.get("installed", [])), - already_present=tuple(result.get("already_present", [])), - failed=tuple(result.get("failed", [])), - ) + return _convert(result) def __repr__(self) -> str: """String representation showing it's a DepsNamespace.""" diff --git a/src/py_code_mode/tools/__init__.py b/src/py_code_mode/tools/__init__.py index 07c96fa..b5f4b83 100644 --- a/src/py_code_mode/tools/__init__.py +++ b/src/py_code_mode/tools/__init__.py @@ -1,6 +1,7 @@ """py_code_mode.tools - Tool registry and namespace.""" from py_code_mode.tools.loader import load_tools_from_path +from py_code_mode.tools.middleware import ToolCallContext, ToolMiddleware from py_code_mode.tools.namespace import ( CallableProxy, ToolProxy, @@ -26,4 +27,6 @@ "ToolProxy", "ToolsNamespace", "load_tools_from_path", + "ToolCallContext", + "ToolMiddleware", ] diff --git a/src/py_code_mode/tools/adapters/__init__.py b/src/py_code_mode/tools/adapters/__init__.py index 93b836c..e44dbf5 100644 --- a/src/py_code_mode/tools/adapters/__init__.py +++ b/src/py_code_mode/tools/adapters/__init__.py @@ -4,6 +4,7 @@ from py_code_mode.tools.adapters.cli import CLIAdapter from py_code_mode.tools.adapters.http import Endpoint, HTTPAdapter from py_code_mode.tools.adapters.mcp import MCPAdapter +from py_code_mode.tools.adapters.middleware import MiddlewareAdapter __all__ = [ "ToolAdapter", @@ -11,4 +12,5 @@ "MCPAdapter", "HTTPAdapter", "Endpoint", + "MiddlewareAdapter", ] diff --git a/src/py_code_mode/tools/adapters/middleware.py b/src/py_code_mode/tools/adapters/middleware.py new file mode 100644 index 0000000..9cc1198 --- /dev/null +++ b/src/py_code_mode/tools/adapters/middleware.py @@ -0,0 +1,65 @@ +"""ToolAdapter wrapper that applies tool call middleware.""" + +from __future__ import annotations + +import uuid +from typing import Any + +from py_code_mode.tools.adapters.base import ToolAdapter +from py_code_mode.tools.middleware import ToolCallContext, ToolMiddleware, compose_tool_middlewares +from py_code_mode.tools.types import Tool + + +class MiddlewareAdapter: + """Wrap a ToolAdapter with a middleware chain for call_tool().""" + + def __init__( + self, + inner: ToolAdapter, + middlewares: tuple[ToolMiddleware, ...], + *, + executor_type: str | None = None, + origin: str | None = None, + ) -> None: + self._inner = inner + self._middlewares = middlewares + self._executor_type = executor_type + self._origin = origin + + @property + def inner(self) -> ToolAdapter: + return self._inner + + def list_tools(self) -> list[Tool]: + return self._inner.list_tools() + + async def describe(self, tool_name: str, callable_name: str) -> dict[str, str]: + return await self._inner.describe(tool_name, callable_name) + + async def call_tool( + self, + name: str, + callable_name: str | None, + args: dict[str, Any], + ) -> Any: + if not self._middlewares: + return await self._inner.call_tool(name, callable_name, args) + + ctx = ToolCallContext( + tool_name=name, + callable_name=callable_name, + args=args, + adapter_name=type(self._inner).__name__, + executor_type=self._executor_type, + origin=self._origin, + 
request_id=uuid.uuid4().hex, + ) + + async def _terminal(c: ToolCallContext) -> Any: + return await self._inner.call_tool(c.tool_name, c.callable_name, c.args) + + chain = compose_tool_middlewares(self._middlewares, _terminal) + return await chain(ctx) + + async def close(self) -> None: + await self._inner.close() diff --git a/src/py_code_mode/tools/middleware.py b/src/py_code_mode/tools/middleware.py new file mode 100644 index 0000000..fe09d39 --- /dev/null +++ b/src/py_code_mode/tools/middleware.py @@ -0,0 +1,72 @@ +"""Tool call middleware and context types. + +This layer is designed to be generic: it can be used for audit logging, +allow/deny decisions, interactive approvals, argument rewriting, retries, etc. + +Middleware runs on the host side where tools are executed (CLI/MCP/HTTP). +""" + +from __future__ import annotations + +from collections.abc import Awaitable, Callable +from dataclasses import dataclass +from typing import Any, Protocol + + +@dataclass +class ToolCallContext: + """Context for a single tool call. + + Notes: + - `args` is intentionally mutable to support argument rewriting. + - `executor_type` and `origin` are best-effort labels (not security boundaries). + """ + + tool_name: str + callable_name: str | None + args: dict[str, Any] + + # Optional metadata for middleware consumers. + adapter_name: str | None = None + executor_type: str | None = None # e.g. "deno-sandbox", "subprocess" + origin: str | None = None # e.g. "deno-sandbox", "host" + request_id: str | None = None + timeout: float | None = None + + @property + def full_name(self) -> str: + if self.callable_name: + return f"{self.tool_name}.{self.callable_name}" + return self.tool_name + + +type CallNext = Callable[[ToolCallContext], Awaitable[Any]] + + +class ToolMiddleware(Protocol): + async def __call__(self, ctx: ToolCallContext, call_next: CallNext) -> Any: ... + + +def compose_tool_middlewares( + middlewares: tuple[ToolMiddleware, ...], + terminal: CallNext, +) -> CallNext: + """Compose middlewares around a terminal call. + + Middleware order is outer-to-inner: + middlewares[0] wraps middlewares[1] wraps ... wraps terminal + """ + + call_next = terminal + for mw in reversed(middlewares): + + async def _wrapped( + ctx: ToolCallContext, + _mw: ToolMiddleware = mw, + _n: CallNext = call_next, + ): + return await _mw(ctx, _n) + + call_next = _wrapped + + return call_next diff --git a/src/py_code_mode/tools/namespace.py b/src/py_code_mode/tools/namespace.py index a3f8b6f..a43b14a 100644 --- a/src/py_code_mode/tools/namespace.py +++ b/src/py_code_mode/tools/namespace.py @@ -4,6 +4,7 @@ import asyncio import builtins +import threading from typing import TYPE_CHECKING, Any from py_code_mode.tools.types import Tool, ToolCallable @@ -35,7 +36,11 @@ def __init__(self, registry: ToolRegistry) -> None: self._loop: asyncio.AbstractEventLoop | None = None def set_loop(self, loop: asyncio.AbstractEventLoop) -> None: - """Set the event loop to use for async tool calls.""" + """Set the event loop used by sync calls made from worker threads. + + InProcessExecutor executes user code in a worker thread. Tool adapters are + async, so sync tool calls use run_coroutine_threadsafe against this loop. 
+ """ self._loop = loop def __getattr__(self, tool_name: str) -> ToolProxy: @@ -94,10 +99,7 @@ def __init__( async def _execute(self, **kwargs: Any) -> Any: """Execute the tool asynchronously.""" tool_name = self._tool.name - adapter = self._registry.find_adapter_for_tool(tool_name) - if adapter is None: - raise RuntimeError(f"No adapter found for tool: {tool_name}") - return await adapter.call_tool(tool_name, None, kwargs) + return await self._registry.call_tool(tool_name, None, kwargs) async def call_async(self, **kwargs: Any) -> Any: """Execute tool asynchronously. Always returns awaitable. @@ -113,37 +115,42 @@ def call_sync(self, **kwargs: Any) -> Any: """ coro = self._execute(**kwargs) - # When called from a thread with loop reference, use run_coroutine_threadsafe + # When called from a worker thread, schedule onto the main loop. if self._loop is not None: future = asyncio.run_coroutine_threadsafe(coro, self._loop) return future.result() - # Standalone sync usage - create new loop - return asyncio.run(coro) + # If we're already inside an event loop on this thread, we cannot call + # asyncio.run(). For sync ergonomics (tools.x.y()), execute the coroutine + # in a dedicated thread with its own loop and block for completion. + try: + asyncio.get_running_loop() + except RuntimeError: + return asyncio.run(coro) + + out: dict[str, Any] = {} + err: list[BaseException] = [] + + def _runner() -> None: + try: + out["value"] = asyncio.run(coro) + except BaseException as e: # propagate exception across threads + err.append(e) + + t = threading.Thread(target=_runner, daemon=True) + t.start() + t.join() + if err: + raise err[0] + return out.get("value") def __call__(self, **kwargs: Any) -> Any: """Escape hatch - invoke tool directly without recipe. - This delegates to the adapter's call_tool method, bypassing recipes. - Returns coroutine in async context, executes sync otherwise. - - When set_loop() has been called, always uses sync execution to support - calling tools from within synchronously-executed workflows. + Tool calls are synchronous in the agent-facing namespace. The underlying + adapter is async, so this blocks until completion. """ - # If we have an explicit loop reference, always use sync path - # This supports calling tools from sync workflow code within async context - if self._loop is not None: - return self.call_sync(**kwargs) - - # Check if we're in async context (has running loop) - try: - asyncio.get_running_loop() - except RuntimeError: - # No event loop running - use sync path - return self.call_sync(**kwargs) - else: - # In async context - return coroutine for await - return self._execute(**kwargs) + return self.call_sync(**kwargs) def __getattr__(self, callable_name: str) -> CallableProxy: """Get a callable proxy by name.""" @@ -178,10 +185,7 @@ def __init__( async def _execute(self, **kwargs: Any) -> Any: """Execute the callable asynchronously.""" - adapter = self._registry.find_adapter_for_tool(self._tool_name) - if adapter is None: - raise RuntimeError(f"No adapter found for tool: {self._tool_name}") - return await adapter.call_tool(self._tool_name, self._callable.name, kwargs) + return await self._registry.call_tool(self._tool_name, self._callable.name, kwargs) async def call_async(self, **kwargs: Any) -> Any: """Execute callable asynchronously. Always returns awaitable. 
@@ -197,37 +201,39 @@ def call_sync(self, **kwargs: Any) -> Any: """ coro = self._execute(**kwargs) - # When called from a thread with loop reference, use run_coroutine_threadsafe + # When called from a worker thread, schedule onto the main loop. if self._loop is not None: future = asyncio.run_coroutine_threadsafe(coro, self._loop) return future.result() - # Standalone sync usage - create new loop - return asyncio.run(coro) + try: + asyncio.get_running_loop() + except RuntimeError: + return asyncio.run(coro) + + out: dict[str, Any] = {} + err: list[BaseException] = [] + + def _runner() -> None: + try: + out["value"] = asyncio.run(coro) + except BaseException as e: + err.append(e) + + t = threading.Thread(target=_runner, daemon=True) + t.start() + t.join() + if err: + raise err[0] + return out.get("value") def __call__(self, **kwargs: Any) -> Any: """Invoke the callable with the given arguments. - Returns a coroutine if called from async context, executes sync otherwise. - This allows both `await tools.x.y()` and `tools.x.y()` to work. - - When set_loop() has been called on the parent namespace, always uses - sync execution to support calling tools from within synchronously-executed workflows. + Callables are synchronous in the agent-facing namespace. The underlying + adapter is async, so this blocks until completion. """ - # If we have an explicit loop reference, always use sync path - # This supports calling tools from sync workflow code within async context - if self._loop is not None: - return self.call_sync(**kwargs) - - # Check if we're in async context (has running loop) - try: - asyncio.get_running_loop() - except RuntimeError: - # No event loop running - use sync path - return self.call_sync(**kwargs) - else: - # In async context - return coroutine for await - return self._execute(**kwargs) + return self.call_sync(**kwargs) async def describe(self) -> dict[str, str]: """Get parameter descriptions for this callable.""" diff --git a/src/py_code_mode/tools/registry.py b/src/py_code_mode/tools/registry.py index b726fe6..b6ab258 100644 --- a/src/py_code_mode/tools/registry.py +++ b/src/py_code_mode/tools/registry.py @@ -3,11 +3,12 @@ from __future__ import annotations import logging -from collections.abc import Callable +from collections.abc import Callable, Sequence from typing import TYPE_CHECKING, Any, TypeVar from py_code_mode.errors import CodeModeError, ToolCallError, ToolNotFoundError from py_code_mode.tools.adapters.base import ToolAdapter +from py_code_mode.tools.middleware import ToolMiddleware from py_code_mode.tools.types import Tool from py_code_mode.workflows import EmbeddingProvider, cosine_similarity @@ -152,6 +153,32 @@ def __init__( self._tools: dict[str, Tool] = {} # name -> Tool self._tool_to_adapter: dict[str, ToolAdapter] = {} # name -> adapter self._vectors: dict[str, list[float]] = {} # name -> embedding vector + self._tool_middlewares: tuple[ToolMiddleware, ...] = () + self._tool_middleware_executor_type: str | None = None + self._tool_middleware_origin: str | None = None + + def _unwrap_adapter(self, adapter: ToolAdapter) -> ToolAdapter: + # Local import to avoid mandatory dependency on middleware wrapper. 
+ from py_code_mode.tools.adapters.middleware import MiddlewareAdapter + + while isinstance(adapter, MiddlewareAdapter): + adapter = adapter.inner + return adapter + + def _wrap_adapter_if_needed(self, adapter: ToolAdapter) -> ToolAdapter: + if not self._tool_middlewares: + return adapter + + from py_code_mode.tools.adapters.middleware import MiddlewareAdapter + + # Avoid stacking wrappers. + adapter = self._unwrap_adapter(adapter) + return MiddlewareAdapter( + adapter, + self._tool_middlewares, + executor_type=self._tool_middleware_executor_type, + origin=self._tool_middleware_origin, + ) @classmethod async def from_dir( @@ -252,7 +279,7 @@ def add_adapter(self, adapter: ToolAdapter) -> None: Args: adapter: The adapter to add. """ - self._adapters.append(adapter) + self._adapters.append(self._wrap_adapter_if_needed(adapter)) def get_adapters(self) -> list[ToolAdapter]: """Get all registered adapters. @@ -308,6 +335,7 @@ def register_adapter( Raises: ValueError: If a tool name conflicts with an existing tool. """ + adapter = self._wrap_adapter_if_needed(adapter) self._adapters.append(adapter) adapter_tools = adapter.list_tools() registered = [] @@ -396,10 +424,16 @@ async def call_tool( ToolNotFoundError: If tool not found. ToolCallError: If tool execution fails. """ - if name not in self._tools: - raise ToolNotFoundError(name, list(self._tools.keys())) + # Normal path: tools registered via register_adapter() + adapter = self._tool_to_adapter.get(name) - adapter = self._tool_to_adapter[name] + # Compatibility path: some code uses add_adapter() (no registration), + # but ToolsNamespace still discovers tools via adapter.list_tools(). + if adapter is None: + adapter = self.find_adapter_for_tool(name) + if adapter is None: + available = [t.name for t in self.get_all_tools()] + raise ToolNotFoundError(name, available) try: return await adapter.call_tool(name, callable_name, args) @@ -501,6 +535,43 @@ async def close(self) -> None: self._tool_to_adapter.clear() self._vectors.clear() + # ------------------------------------------------------------------------- + # Middleware + # ------------------------------------------------------------------------- + + def apply_tool_middlewares( + self, + middlewares: Sequence[ToolMiddleware], + *, + executor_type: str | None = None, + origin: str | None = None, + ) -> None: + """Apply tool call middleware chain to all adapters. + + This method mutates the registry in-place and updates internal mappings + so that *all* tool call paths (ToolsNamespace, RPC providers, registry.call_tool) + are routed through the middleware chain. + + Notes: + - Only `call_tool()` is wrapped. `list_tools()` and `describe()` are passed through. + - Applying multiple times replaces the active middleware chain. + """ + self._tool_middlewares = tuple(middlewares) + self._tool_middleware_executor_type = executor_type + self._tool_middleware_origin = origin + + base_adapters = [self._unwrap_adapter(a) for a in self._adapters] + wrapped_adapters = [self._wrap_adapter_if_needed(a) for a in base_adapters] + base_to_wrapped = {id(b): w for b, w in zip(base_adapters, wrapped_adapters, strict=True)} + self._adapters = wrapped_adapters + + # Update tool->adapter mapping used by registry.call_tool(). 
+ for tool_name, adapter in list(self._tool_to_adapter.items()): + base = self._unwrap_adapter(adapter) + mapped = base_to_wrapped.get(id(base)) + if mapped is not None: + self._tool_to_adapter[tool_name] = mapped + class ScopedToolRegistry: """A scoped view of a ToolRegistry that only exposes matching tools. diff --git a/tests/conftest.py b/tests/conftest.py index 5c6c8cf..b480a9c 100644 --- a/tests/conftest.py +++ b/tests/conftest.py @@ -59,6 +59,16 @@ def _patched_embedder_init(self, model_name=None, start_loading=False): TESTCONTAINERS_AVAILABLE = False +def _docker_daemon_is_available() -> bool: + try: + import docker + + docker.from_env().ping() + return True + except Exception: + return False + + # ============================================================================= # Docker Image Staleness Check # ============================================================================= @@ -211,13 +221,22 @@ def docker_image_check(): def pytest_collection_modifyitems(config, items): # noqa: ARG001 """Add docker_image_check fixture to all tests in xdist_group('docker').""" + docker_fixtures = {"redis_container", "redis_client", "redis_url"} for item in items: + if docker_fixtures.intersection(getattr(item, "fixturenames", ())): + item.add_marker(pytest.mark.docker) + # Check if test is in the docker xdist group for marker in item.iter_markers("xdist_group"): if marker.args and marker.args[0] == "docker": + item.add_marker(pytest.mark.docker) # Add the fixture as a dependency if "docker_image_check" not in item.fixturenames: item.fixturenames.insert(0, "docker_image_check") + elif marker.args and marker.args[0] == "subprocess": + item.add_marker(pytest.mark.subprocess) + elif marker.args and marker.args[0] == "venv": + item.add_marker(pytest.mark.venv) class MockAdapter: @@ -781,6 +800,12 @@ def redis_container(): """ if not TESTCONTAINERS_AVAILABLE: pytest.skip("testcontainers[redis] not installed") + if not _docker_daemon_is_available(): + if os.environ.get("CI"): + pytest.fail( + "Docker daemon not available for testcontainers Redis (CI should provide Docker)" + ) + pytest.skip("Docker daemon not available for testcontainers Redis") with RedisContainer(image="redis:7-alpine") as container: yield container diff --git a/tests/test_async_sandbox_interfaces.py b/tests/test_async_sandbox_interfaces.py new file mode 100644 index 0000000..abf89e1 --- /dev/null +++ b/tests/test_async_sandbox_interfaces.py @@ -0,0 +1,143 @@ +import os +from pathlib import Path + +import pytest + + +@pytest.mark.asyncio +async def test_inprocess_executor_tools_and_artifacts_are_sync_in_agent_code( + tmp_path: Path, +) -> None: + from py_code_mode.execution import InProcessConfig, InProcessExecutor + from py_code_mode.session import Session + from py_code_mode.storage import FileStorage + + tools_dir = tmp_path / "tools" + tools_dir.mkdir(parents=True, exist_ok=True) + (tools_dir / "echo.yaml").write_text( + "\n".join( + [ + "name: echo", + "description: Echo text", + "command: /bin/echo", + "timeout: 5", + "schema:", + " positional:", + " - name: message", + " type: string", + " required: true", + " description: message", + "recipes:", + " say:", + " description: Echo message", + " params:", + " message: {}", + "", + ] + ), + encoding="utf-8", + ) + + storage = FileStorage(tmp_path / "storage") + executor = InProcessExecutor(config=InProcessConfig(tools_path=tools_dir)) + + async with Session(storage=storage, executor=executor) as session: + r_list = await session.run("_ts = tools.list()\nsorted([t.name for t 
in _ts])") + assert r_list.error is None + assert "echo" in r_list.value + + r_call = await session.run("tools.echo.say(message='hi').strip()") + assert r_call.error is None + assert r_call.value == "hi" + + r_art = await session.run( + "\n".join( + [ + "artifacts.save('obj', {'a': 1}, description='')", + "artifacts.load('obj')['a']", + ] + ) + ) + assert r_art.error is None + assert r_art.value == 1 + + +pytestmark_subprocess = pytest.mark.skipif( + os.environ.get("PY_CODE_MODE_TEST_SUBPROCESS") == "0", + reason="Subprocess async-sandbox smoke can be disabled with PY_CODE_MODE_TEST_SUBPROCESS=0", +) + + +@pytestmark_subprocess +@pytest.mark.asyncio +async def test_subprocess_executor_tools_workflows_artifacts_are_sync_in_agent_code( + tmp_path: Path, +) -> None: + from py_code_mode.execution import SubprocessConfig, SubprocessExecutor + from py_code_mode.session import Session + from py_code_mode.storage import FileStorage + + tools_dir = tmp_path / "tools" + tools_dir.mkdir(parents=True, exist_ok=True) + (tools_dir / "echo.yaml").write_text( + "\n".join( + [ + "name: echo", + "description: Echo text", + "command: /bin/echo", + "timeout: 5", + "schema:", + " positional:", + " - name: message", + " type: string", + " required: true", + " description: message", + "recipes:", + " say:", + " description: Echo message", + " params:", + " message: {}", + "", + ] + ), + encoding="utf-8", + ) + + storage = FileStorage(tmp_path / "storage") + executor = SubprocessExecutor( + config=SubprocessConfig(tools_path=tools_dir, default_timeout=60.0) + ) + + async with Session(storage=storage, executor=executor) as session: + r_list = await session.run( + "_ts = tools.list()\nsorted([t['name'] for t in _ts])", + ) + assert r_list.error is None + assert "echo" in r_list.value + + r_call = await session.run("tools.echo.say(message='hi').strip()") + assert r_call.error is None + assert r_call.value == "hi" + + source = "async def run(name: str) -> str:\n return 'hi ' + name\n" + r_wf = await session.run( + "\n".join( + [ + f"workflows.create('hello', {source!r}, 'desc')", + "workflows.get('hello')['source']", + ] + ) + ) + assert r_wf.error is None + assert r_wf.value == source + + r_art = await session.run( + "\n".join( + [ + "artifacts.save('obj', {'a': 1}, description='')", + "artifacts.load('obj')['a']", + ] + ) + ) + assert r_art.error is None + assert r_art.value == 1 diff --git a/tests/test_backend.py b/tests/test_backend.py index f899c78..fdc3540 100644 --- a/tests/test_backend.py +++ b/tests/test_backend.py @@ -102,106 +102,6 @@ async def test_context_manager_support(self, tmp_path) -> None: # After exit, resources should be released -class TestCapabilityConstants: - """Tests for Capability constants.""" - - def test_timeout_capability_exists(self) -> None: - """TIMEOUT capability must be defined.""" - assert hasattr(Capability, "TIMEOUT") - assert Capability.TIMEOUT == "timeout" - - def test_process_isolation_capability_exists(self) -> None: - """PROCESS_ISOLATION capability must be defined.""" - assert hasattr(Capability, "PROCESS_ISOLATION") - assert Capability.PROCESS_ISOLATION == "process_isolation" - - def test_network_isolation_capability_exists(self) -> None: - """NETWORK_ISOLATION capability must be defined.""" - assert hasattr(Capability, "NETWORK_ISOLATION") - assert Capability.NETWORK_ISOLATION == "network_isolation" - - def test_network_filtering_capability_exists(self) -> None: - """NETWORK_FILTERING capability must be defined.""" - assert hasattr(Capability, "NETWORK_FILTERING") - 
assert Capability.NETWORK_FILTERING == "network_filtering" - - def test_filesystem_isolation_capability_exists(self) -> None: - """FILESYSTEM_ISOLATION capability must be defined.""" - assert hasattr(Capability, "FILESYSTEM_ISOLATION") - assert Capability.FILESYSTEM_ISOLATION == "filesystem_isolation" - - def test_memory_limit_capability_exists(self) -> None: - """MEMORY_LIMIT capability must be defined.""" - assert hasattr(Capability, "MEMORY_LIMIT") - assert Capability.MEMORY_LIMIT == "memory_limit" - - def test_cpu_limit_capability_exists(self) -> None: - """CPU_LIMIT capability must be defined.""" - assert hasattr(Capability, "CPU_LIMIT") - assert Capability.CPU_LIMIT == "cpu_limit" - - def test_reset_capability_exists(self) -> None: - """RESET capability must be defined.""" - assert hasattr(Capability, "RESET") - assert Capability.RESET == "reset" - - def test_all_returns_set_of_all_capabilities(self) -> None: - """Capability.all() must return set of all defined capabilities.""" - all_caps = Capability.all() - - assert isinstance(all_caps, set) - assert Capability.TIMEOUT in all_caps - assert Capability.NETWORK_ISOLATION in all_caps - assert len(all_caps) >= 8 # At least 8 capabilities defined - - -class TestExecutionResult: - """Tests for the unified ExecutionResult type.""" - - def test_result_has_value(self) -> None: - """ExecutionResult must have value field.""" - result = ExecutionResult(value=42, stdout="", error=None) - assert result.value == 42 - - def test_result_has_stdout(self) -> None: - """ExecutionResult must have stdout field.""" - result = ExecutionResult(value=None, stdout="output", error=None) - assert result.stdout == "output" - - def test_result_has_error(self) -> None: - """ExecutionResult must have error field.""" - result = ExecutionResult(value=None, stdout="", error="Something broke") - assert result.error == "Something broke" - - def test_result_is_ok_property(self) -> None: - """ExecutionResult must have is_ok property.""" - success = ExecutionResult(value=42, stdout="", error=None) - failure = ExecutionResult(value=None, stdout="", error="oops") - - assert success.is_ok is True - assert failure.is_ok is False - - def test_result_has_optional_execution_time(self) -> None: - """ExecutionResult may have execution_time_ms field.""" - result = ExecutionResult( - value=42, - stdout="", - error=None, - execution_time_ms=123.45, - ) - assert result.execution_time_ms == 123.45 - - def test_result_has_optional_backend_info(self) -> None: - """ExecutionResult may have backend_info dict.""" - result = ExecutionResult( - value=42, - stdout="", - error=None, - backend_info={"session_id": "abc123"}, - ) - assert result.backend_info["session_id"] == "abc123" - - class TestBackendRegistry: """Tests for backend registration and discovery.""" diff --git a/tests/test_deno_sandbox_executor.py b/tests/test_deno_sandbox_executor.py new file mode 100644 index 0000000..2c57ee6 --- /dev/null +++ b/tests/test_deno_sandbox_executor.py @@ -0,0 +1,755 @@ +import hashlib +import math +import os +from dataclasses import dataclass +from pathlib import Path + +import pytest + +pytestmark = pytest.mark.skipif( + os.environ.get("PY_CODE_MODE_TEST_DENO") != "1", + reason="Set PY_CODE_MODE_TEST_DENO=1 to run Deno/Pyodide integration tests.", +) + + +class _StableEmbedder: + """Deterministic lightweight embedder for integration tests. + + Avoids pulling large sentence-transformers models while still exercising + semantic-search codepaths. 
+ """ + + def __init__(self, dimension: int = 64) -> None: + self._dimension = dimension + + @property + def dimension(self) -> int: + return self._dimension + + def _embed_one(self, text: str) -> list[float]: + vec = [0.0] * self._dimension + for token in "".join(c.lower() if c.isalnum() else " " for c in text).split(): + h = hashlib.sha256(token.encode("utf-8")).digest() + idx = int.from_bytes(h[:4], "big") % self._dimension + vec[idx] += 1.0 + norm = math.sqrt(sum(v * v for v in vec)) or 1.0 + return [v / norm for v in vec] + + def embed(self, texts: list[str]) -> list[list[float]]: + return [self._embed_one(t) for t in texts] + + def embed_query(self, query: str) -> list[float]: + return self._embed_one(query) + + +@dataclass +class _TestStorage: + """Minimal StorageBackend for exercising workflows/artifacts via RPC.""" + + root: Path + + def __post_init__(self) -> None: + self.root.mkdir(parents=True, exist_ok=True) + + from py_code_mode.artifacts import FileArtifactStore + from py_code_mode.workflows import FileWorkflowStore, WorkflowLibrary + + self._artifact_store = FileArtifactStore(self.root / "artifacts") + self._workflow_store = FileWorkflowStore(self.root / "workflows") + self._workflow_library = WorkflowLibrary( + embedder=_StableEmbedder(), + store=self._workflow_store, + vector_store=None, + ) + + def get_serializable_access(self): + from py_code_mode.execution.protocol import FileStorageAccess + + return FileStorageAccess( + workflows_path=self.root / "workflows", + artifacts_path=self.root / "artifacts", + vectors_path=None, + ) + + def get_workflow_library(self): + return self._workflow_library + + def get_artifact_store(self): + return self._artifact_store + + +@pytest.mark.asyncio +async def test_deno_sandbox_executor_basic(tmp_path: Path) -> None: + from py_code_mode.execution import DenoSandboxConfig, DenoSandboxExecutor + from py_code_mode.session import Session + from py_code_mode.storage import FileStorage + + storage = FileStorage(tmp_path / "storage") + deno_dir = tmp_path / "deno_dir" + deno_dir.mkdir(parents=True, exist_ok=True) + + executor = DenoSandboxExecutor( + DenoSandboxConfig( + deno_dir=deno_dir, + default_timeout=60.0, + ipc_timeout=120.0, + network_profile="none", + ) + ) + + async with Session(storage=storage, executor=executor) as session: + r1 = await session.run("1 + 1") + assert r1.error is None + assert r1.value == 2 + + r2 = await session.run("x = 40") + assert r2.error is None + + r3 = await session.run("x + 2") + assert r3.error is None + assert r3.value == 42 + + +@pytest.mark.asyncio +async def test_deno_sandbox_executor_deps_add_installs(tmp_path: Path) -> None: + from py_code_mode.execution import DenoSandboxConfig, DenoSandboxExecutor + from py_code_mode.session import Session + from py_code_mode.storage import FileStorage + + storage = FileStorage(tmp_path / "storage") + deno_dir = tmp_path / "deno_dir" + deno_dir.mkdir(parents=True, exist_ok=True) + + executor = DenoSandboxExecutor( + DenoSandboxConfig( + deno_dir=deno_dir, + default_timeout=300.0, + deps_timeout=300.0, + ipc_timeout=120.0, + network_profile="deps-only", + ) + ) + + async with Session(storage=storage, executor=executor) as session: + r = await session.run( + "await deps.add('packaging')\nimport packaging\npackaging.__version__" + ) + assert r.error is None + assert isinstance(r.value, str) + assert r.value + + +@pytest.mark.asyncio +async def test_deno_sandbox_executor_sync_deps_on_start(tmp_path: Path) -> None: + from py_code_mode.execution import DenoSandboxConfig, 
DenoSandboxExecutor + from py_code_mode.session import Session + from py_code_mode.storage import FileStorage + + storage = FileStorage(tmp_path / "storage") + deno_dir = tmp_path / "deno_dir" + deno_dir.mkdir(parents=True, exist_ok=True) + + executor = DenoSandboxExecutor( + DenoSandboxConfig( + deno_dir=deno_dir, + default_timeout=60.0, + deps_timeout=300.0, + ipc_timeout=120.0, + deps=("packaging",), + network_profile="deps-only", + ) + ) + + async with Session(storage=storage, executor=executor, sync_deps_on_start=True) as session: + r = await session.run("import packaging\npackaging.__version__") + assert r.error is None + assert isinstance(r.value, str) + assert r.value + + +@pytest.mark.asyncio +async def test_deno_sandbox_executor_network_none_blocks_installs(tmp_path: Path) -> None: + from py_code_mode.execution import DenoSandboxConfig, DenoSandboxExecutor + from py_code_mode.session import Session + from py_code_mode.storage import FileStorage + + storage = FileStorage(tmp_path / "storage") + deno_dir = tmp_path / "deno_dir" + deno_dir.mkdir(parents=True, exist_ok=True) + + executor = DenoSandboxExecutor( + DenoSandboxConfig( + deno_dir=deno_dir, + default_timeout=120.0, + deps_timeout=120.0, + ipc_timeout=120.0, + network_profile="none", + ) + ) + + async with Session(storage=storage, executor=executor) as session: + r = await session.run( + "await deps.add('packaging')\nimport packaging\npackaging.__version__" + ) + assert r.error is not None + + +@pytest.mark.asyncio +async def test_deno_sandbox_executor_artifacts_roundtrip(tmp_path: Path) -> None: + from py_code_mode.execution import DenoSandboxConfig, DenoSandboxExecutor + from py_code_mode.session import Session + from py_code_mode.storage import FileStorage + + storage = FileStorage(tmp_path / "storage") + deno_dir = tmp_path / "deno_dir" + deno_dir.mkdir(parents=True, exist_ok=True) + + executor = DenoSandboxExecutor( + DenoSandboxConfig( + deno_dir=deno_dir, + default_timeout=60.0, + ipc_timeout=120.0, + network_profile="none", + ) + ) + + async with Session(storage=storage, executor=executor) as session: + r = await session.run( + "await artifacts.save('obj', {'a': 1, 'b': [2, 3]}, description='t')\n" + "(await artifacts.load('obj'))['b'][1]" + ) + assert r.error is None + assert r.value == 3 + + +@pytest.mark.asyncio +async def test_deno_sandbox_executor_workflows_roundtrip(tmp_path: Path) -> None: + from py_code_mode.execution import DenoSandboxConfig, DenoSandboxExecutor + from py_code_mode.session import Session + from py_code_mode.storage import FileStorage + + storage = FileStorage(tmp_path / "storage") + deno_dir = tmp_path / "deno_dir" + deno_dir.mkdir(parents=True, exist_ok=True) + + executor = DenoSandboxExecutor( + DenoSandboxConfig( + deno_dir=deno_dir, + default_timeout=60.0, + ipc_timeout=120.0, + network_profile="none", + ) + ) + + source = "async def run(name: str) -> str:\n return 'hi ' + name\n" + + async with Session(storage=storage, executor=executor) as session: + r = await session.run( + "await workflows.create('hello', " + f"{source!r}, " + "'test wf')\n" + "(await workflows.get('hello'))['source']" + ) + assert r.error is None + assert r.value == source + + r2 = await session.run("await workflows.invoke('hello', name='py-code-mode')") + assert r2.error is None + assert r2.value == "hi py-code-mode" + + +@pytest.mark.asyncio +async def test_deno_sandbox_executor_workflow_calls_other_workflow(tmp_path: Path) -> None: + """Ensure a workflow can invoke another workflow inside the sandbox.""" + + 
from py_code_mode.execution import DenoSandboxConfig, DenoSandboxExecutor + from py_code_mode.session import Session + from py_code_mode.storage import FileStorage + + storage = FileStorage(tmp_path / "storage") + deno_dir = tmp_path / "deno_dir" + deno_dir.mkdir(parents=True, exist_ok=True) + + executor = DenoSandboxExecutor( + DenoSandboxConfig( + deno_dir=deno_dir, + default_timeout=60.0, + ipc_timeout=120.0, + network_profile="none", + ) + ) + + src_double = "async def run(x: int) -> int:\n return x * 2\n" + src_quadruple = ( + "async def run(x: int) -> int:\n" + " d = await workflows.invoke(workflow_name='double', x=x)\n" + " return await workflows.invoke(workflow_name='double', x=d)\n" + ) + + async with Session(storage=storage, executor=executor) as session: + r1 = await session.run(f"await workflows.create('double', {src_double!r}, 'double')") + assert r1.error is None + + r2 = await session.run( + f"await workflows.create('quadruple', {src_quadruple!r}, 'quadruple')" + ) + assert r2.error is None + + r3 = await session.run("await workflows.invoke('quadruple', x=10)") + assert r3.error is None + assert r3.value == 40 + + +@pytest.mark.asyncio +async def test_deno_sandbox_executor_tools_via_rpc(tmp_path: Path) -> None: + from py_code_mode.execution import DenoSandboxConfig, DenoSandboxExecutor + from py_code_mode.session import Session + from py_code_mode.storage import FileStorage + + tools_dir = tmp_path / "tools" + tools_dir.mkdir(parents=True, exist_ok=True) + (tools_dir / "echo.yaml").write_text( + "\n".join( + [ + "name: echo", + "description: Echo text", + "command: /bin/echo", + "timeout: 5", + "schema:", + " positional:", + " - name: message", + " type: string", + " required: true", + " description: message", + "recipes:", + " say:", + " description: Echo message", + " params:", + " message: {}", + "", + ] + ), + encoding="utf-8", + ) + + storage = FileStorage(tmp_path / "storage") + deno_dir = tmp_path / "deno_dir" + deno_dir.mkdir(parents=True, exist_ok=True) + + executor = DenoSandboxExecutor( + DenoSandboxConfig( + deno_dir=deno_dir, + tools_path=tools_dir, + default_timeout=60.0, + ipc_timeout=120.0, + network_profile="none", + ) + ) + + async with Session(storage=storage, executor=executor) as session: + r_list = await session.run("_ts = await tools.list()\nsorted([t['name'] for t in _ts])") + assert r_list.error is None + assert "echo" in r_list.value + + r = await session.run("(await tools.echo.say(message='hi')).strip()") + assert r.error is None + assert r.value == "hi" + + +@pytest.mark.asyncio +async def test_deno_sandbox_executor_tool_middleware_is_invoked(tmp_path: Path) -> None: + from py_code_mode.execution import DenoSandboxConfig, DenoSandboxExecutor + from py_code_mode.session import Session + from py_code_mode.storage import FileStorage + from py_code_mode.tools import ToolCallContext, ToolMiddleware + + tools_dir = tmp_path / "tools" + tools_dir.mkdir(parents=True, exist_ok=True) + (tools_dir / "echo.yaml").write_text( + "\n".join( + [ + "name: echo", + "description: Echo text", + "command: /bin/echo", + "timeout: 5", + "schema:", + " positional:", + " - name: message", + " type: string", + " required: true", + " description: message", + "recipes:", + " say:", + " description: Echo message", + " params:", + " message: {}", + "", + ] + ), + encoding="utf-8", + ) + + events: list[str] = [] + + class _Recorder(ToolMiddleware): + async def __call__(self, ctx: ToolCallContext, call_next): # type: ignore[override] + 
events.append(f"pre:{ctx.full_name}:{ctx.executor_type}:{ctx.origin}") + out = await call_next(ctx) + events.append(f"post:{ctx.full_name}") + return out + + storage = FileStorage(tmp_path / "storage") + deno_dir = tmp_path / "deno_dir" + deno_dir.mkdir(parents=True, exist_ok=True) + + executor = DenoSandboxExecutor( + DenoSandboxConfig( + deno_dir=deno_dir, + tools_path=tools_dir, + tool_middlewares=(_Recorder(),), + default_timeout=60.0, + ipc_timeout=120.0, + network_profile="none", + ) + ) + + async with Session(storage=storage, executor=executor) as session: + r = await session.run("(await tools.echo.say(message='hi')).strip()") + assert r.error is None + assert r.value == "hi" + + assert events == [ + "pre:echo.say:deno-sandbox:deno-sandbox", + "post:echo.say", + ] + + +@pytest.mark.asyncio +async def test_deno_sandbox_executor_tool_large_output_is_chunked(tmp_path: Path) -> None: + from py_code_mode.execution import DenoSandboxConfig, DenoSandboxExecutor + from py_code_mode.session import Session + from py_code_mode.storage import FileStorage + + tools_dir = tmp_path / "tools" + tools_dir.mkdir(parents=True, exist_ok=True) + (tools_dir / "pyrun.yaml").write_text( + "\n".join( + [ + "name: pyrun", + "description: Run Python snippet", + "command: python", + "timeout: 10", + "schema:", + " options:", + " command:", + " type: string", + " short: c", + " description: code snippet", + "recipes:", + " run:", + " description: Run snippet via -c", + " params:", + " command: {}", + "", + ] + ), + encoding="utf-8", + ) + + storage = FileStorage(tmp_path / "storage") + deno_dir = tmp_path / "deno_dir" + deno_dir.mkdir(parents=True, exist_ok=True) + + executor = DenoSandboxExecutor( + DenoSandboxConfig( + deno_dir=deno_dir, + tools_path=tools_dir, + default_timeout=180.0, + ipc_timeout=120.0, + network_profile="none", + ) + ) + + async with Session(storage=storage, executor=executor) as session: + r = await session.run( + "\n".join( + [ + "code = \"import sys; sys.stdout.write('x' * (2 * 1024 * 1024))\"", + "len(await tools.pyrun.run(command=code))", + ] + ) + ) + assert r.error is None + assert r.value == 2 * 1024 * 1024 + + +@pytest.mark.asyncio +async def test_deno_sandbox_executor_rpc_does_not_deadlock(tmp_path: Path) -> None: + from py_code_mode.execution import DenoSandboxConfig, DenoSandboxExecutor + from py_code_mode.session import Session + from py_code_mode.storage import FileStorage + + storage = FileStorage(tmp_path / "storage") + deno_dir = tmp_path / "deno_dir" + deno_dir.mkdir(parents=True, exist_ok=True) + + executor = DenoSandboxExecutor( + DenoSandboxConfig( + deno_dir=deno_dir, + default_timeout=15.0, + ipc_timeout=120.0, + network_profile="none", + ) + ) + + async with Session(storage=storage, executor=executor) as session: + r = await session.run( + "\n".join( + [ + "await artifacts.save('x', {'n': 1}, description='')", + "s = 0", + "for _ in range(50):", + " if await artifacts.exists('x'):", + " s += (await artifacts.load('x'))['n']", + "s", + ] + ) + ) + assert r.error is None + assert r.value == 50 + + +@pytest.mark.asyncio +async def test_deno_sandbox_executor_reset_clears_state(tmp_path: Path) -> None: + from py_code_mode.execution import DenoSandboxConfig, DenoSandboxExecutor + from py_code_mode.session import Session + from py_code_mode.storage import FileStorage + + storage = FileStorage(tmp_path / "storage") + deno_dir = tmp_path / "deno_dir" + deno_dir.mkdir(parents=True, exist_ok=True) + + executor = DenoSandboxExecutor( + DenoSandboxConfig( + deno_dir=deno_dir, + 
default_timeout=60.0, + ipc_timeout=120.0, + network_profile="none", + ) + ) + + async with Session(storage=storage, executor=executor) as session: + r1 = await session.run("x = 1\nx") + assert r1.error is None + assert r1.value == 1 + + await session.reset() + + r2 = await session.run("x") + assert r2.error is not None + + +@pytest.mark.asyncio +async def test_deno_sandbox_executor_session_add_dep_installs(tmp_path: Path) -> None: + from py_code_mode.execution import DenoSandboxConfig, DenoSandboxExecutor + from py_code_mode.session import Session + from py_code_mode.storage import FileStorage + + storage = FileStorage(tmp_path / "storage") + deno_dir = tmp_path / "deno_dir" + deno_dir.mkdir(parents=True, exist_ok=True) + + executor = DenoSandboxExecutor( + DenoSandboxConfig( + deno_dir=deno_dir, + default_timeout=300.0, + deps_timeout=300.0, + ipc_timeout=120.0, + network_profile="deps-only", + ) + ) + + async with Session(storage=storage, executor=executor) as session: + out = await session.add_dep("packaging") + assert out["failed"] == [] + + r = await session.run("import packaging\npackaging.__version__") + assert r.error is None + assert isinstance(r.value, str) + + +@pytest.mark.asyncio +async def test_deno_sandbox_executor_mcp_tool_via_rpc(tmp_path: Path) -> None: + from py_code_mode.execution import DenoSandboxConfig, DenoSandboxExecutor + from py_code_mode.session import Session + from py_code_mode.storage import FileStorage + + tools_dir = tmp_path / "tools" + tools_dir.mkdir(parents=True, exist_ok=True) + + # Local stdio MCP server using fastmcp. + mcp_server = tmp_path / "mcp_server.py" + mcp_server.write_text( + "\n".join( + [ + "from fastmcp import FastMCP", + "", + "mcp = FastMCP('test')", + "", + "@mcp.tool", + "async def add(a: int, b: int) -> str:", + " return str(a + b)", + "", + "if __name__ == '__main__':", + " mcp.run()", + "", + ] + ), + encoding="utf-8", + ) + + (tools_dir / "math.yaml").write_text( + "\n".join( + [ + "name: math", + "type: mcp", + "transport: stdio", + "command: python", + f"args: [{mcp_server!s}]", + "description: Simple math MCP server", + "", + ] + ), + encoding="utf-8", + ) + + storage = FileStorage(tmp_path / "storage") + deno_dir = tmp_path / "deno_dir" + deno_dir.mkdir(parents=True, exist_ok=True) + + executor = DenoSandboxExecutor( + DenoSandboxConfig( + deno_dir=deno_dir, + tools_path=tools_dir, + default_timeout=60.0, + ipc_timeout=120.0, + network_profile="none", + ) + ) + + async with Session(storage=storage, executor=executor) as session: + r_list = await session.run("_ts = await tools.list()\nsorted([t['name'] for t in _ts])") + assert r_list.error is None + assert "math" in r_list.value + + r = await session.run("(await tools.math.add(a=2, b=3)).strip()") + assert r.error is None + assert r.value == "5" + + +@pytest.mark.asyncio +async def test_deno_sandbox_executor_workflows_search_via_rpc(tmp_path: Path) -> None: + from py_code_mode.execution import DenoSandboxConfig, DenoSandboxExecutor + from py_code_mode.session import Session + + storage = _TestStorage(tmp_path / "storage") + deno_dir = tmp_path / "deno_dir" + deno_dir.mkdir(parents=True, exist_ok=True) + + executor = DenoSandboxExecutor( + DenoSandboxConfig( + deno_dir=deno_dir, + default_timeout=60.0, + ipc_timeout=120.0, + network_profile="none", + ) + ) + + src = "async def run() -> str:\n return 'hello world'\n" + + async with Session(storage=storage, executor=executor) as session: + r1 = await session.run(f"await workflows.create('wf', {src!r}, 'greeting workflow')") + 
assert r1.error is None + + r2 = await session.run("(await workflows.search('greeting', limit=5))[0]['name']") + assert r2.error is None + assert r2.value == "wf" + + +@pytest.mark.asyncio +async def test_deno_sandbox_executor_artifact_payload_size_limits(tmp_path: Path) -> None: + from py_code_mode.execution import DenoSandboxConfig, DenoSandboxExecutor + from py_code_mode.session import Session + from py_code_mode.storage import FileStorage + + storage = FileStorage(tmp_path / "storage") + store = storage.get_artifact_store() + store.save("small", "x" * (200 * 1024), description="") + store.save("big", "x" * (2 * 1024 * 1024), description="") + deno_dir = tmp_path / "deno_dir" + deno_dir.mkdir(parents=True, exist_ok=True) + + executor = DenoSandboxExecutor( + DenoSandboxConfig( + deno_dir=deno_dir, + default_timeout=180.0, + ipc_timeout=120.0, + network_profile="none", + ) + ) + + async with Session(storage=storage, executor=executor) as session: + r_ok = await session.run( + "\n".join( + [ + "len(await artifacts.load('small'))", + ] + ) + ) + assert r_ok.error is None + assert r_ok.value == 200 * 1024 + + r_big = await session.run( + "\n".join( + [ + "len(await artifacts.load('big'))", + ] + ) + ) + assert r_big.error is None + assert r_big.value == 2 * 1024 * 1024 + + +@pytest.mark.asyncio +async def test_deno_sandbox_executor_soft_timeout_wedges_until_reset(tmp_path: Path) -> None: + from py_code_mode.execution import DenoSandboxConfig, DenoSandboxExecutor + from py_code_mode.session import Session + from py_code_mode.storage import FileStorage + + storage = FileStorage(tmp_path / "storage") + deno_dir = tmp_path / "deno_dir" + deno_dir.mkdir(parents=True, exist_ok=True) + + executor = DenoSandboxExecutor( + DenoSandboxConfig( + deno_dir=deno_dir, + default_timeout=0.05, + ipc_timeout=120.0, + network_profile="none", + ) + ) + + async with Session(storage=storage, executor=executor) as session: + r1 = await session.run("import time\ntime.sleep(0.2)\n1") + assert r1.error is not None + assert "timeout" in r1.error.lower() + + r2 = await session.run("1 + 1") + assert r2.error is not None + assert "previous execution timed out" in r2.error.lower() + + await session.reset() + + r3 = await session.run("1 + 1") + assert r3.error is None + assert r3.value == 2 diff --git a/tests/test_deno_sandbox_imports.py b/tests/test_deno_sandbox_imports.py new file mode 100644 index 0000000..b16fe5d --- /dev/null +++ b/tests/test_deno_sandbox_imports.py @@ -0,0 +1,13 @@ +import pytest + + +def test_deno_sandbox_imports() -> None: + from py_code_mode.execution import DENO_SANDBOX_AVAILABLE + + if not DENO_SANDBOX_AVAILABLE: + pytest.skip("Deno sandbox backend is optional and not available in this environment.") + + from py_code_mode.execution import DenoSandboxConfig, DenoSandboxExecutor + + assert DenoSandboxConfig is not None + assert DenoSandboxExecutor is not None diff --git a/tests/test_deps_installer.py b/tests/test_deps_installer.py index cc9c076..6b4f4c1 100644 --- a/tests/test_deps_installer.py +++ b/tests/test_deps_installer.py @@ -121,59 +121,6 @@ async def test_developer_adds_more_deps_after_sync(self, tmp_path: Path) -> None assert "numpy" in result.installed -# ============================================================================= -# Contract Tests (SyncResult) -# ============================================================================= - - -class TestSyncResultContract: - """Tests for SyncResult dataclass/structure.""" - - def test_sync_result_has_installed_attribute(self) -> 
None: - """SyncResult has 'installed' attribute (set of packages). - - Breaks when: SyncResult structure is wrong. - """ - from py_code_mode.deps import SyncResult - - result = SyncResult(installed=set(), already_present=set(), failed=set()) - assert hasattr(result, "installed") - assert isinstance(result.installed, set) - - def test_sync_result_has_already_present_attribute(self) -> None: - """SyncResult has 'already_present' attribute (set of packages). - - Breaks when: SyncResult structure is wrong. - """ - from py_code_mode.deps import SyncResult - - result = SyncResult(installed=set(), already_present=set(), failed=set()) - assert hasattr(result, "already_present") - assert isinstance(result.already_present, set) - - def test_sync_result_has_failed_attribute(self) -> None: - """SyncResult has 'failed' attribute (set of packages). - - Breaks when: SyncResult structure is wrong. - """ - from py_code_mode.deps import SyncResult - - result = SyncResult(installed=set(), already_present=set(), failed=set()) - assert hasattr(result, "failed") - assert isinstance(result.failed, set) - - def test_sync_result_is_dataclass(self) -> None: - """SyncResult is a dataclass for easy construction. - - Breaks when: SyncResult is not a dataclass. - """ - from dataclasses import is_dataclass - - from py_code_mode.deps import SyncResult - - assert is_dataclass(SyncResult) - - # ============================================================================= # PackageInstaller Contract Tests # ============================================================================= @@ -182,17 +129,6 @@ def test_sync_result_is_dataclass(self) -> None: class TestPackageInstallerContract: """Tests for PackageInstaller public API.""" - def test_installer_has_sync_method(self) -> None: - """PackageInstaller has sync(store) method. - - Breaks when: sync method is missing. - """ - from py_code_mode.deps import PackageInstaller - - installer = PackageInstaller() - assert hasattr(installer, "sync") - assert callable(installer.sync) - def test_sync_returns_sync_result(self, tmp_path: Path) -> None: """sync() returns SyncResult. @@ -576,7 +512,6 @@ def test_installer_default_timeout(self) -> None: from py_code_mode.deps import PackageInstaller installer = PackageInstaller() - assert hasattr(installer, "timeout") assert installer.timeout >= 60 # At least 60 seconds def test_installer_accepts_extra_pip_args(self, tmp_path: Path) -> None: diff --git a/tests/test_deps_namespace.py b/tests/test_deps_namespace.py index b7c1819..6687d5b 100644 --- a/tests/test_deps_namespace.py +++ b/tests/test_deps_namespace.py @@ -150,62 +150,6 @@ def test_agent_syncs_all_deps(self, tmp_path: Path) -> None: class TestDepsNamespaceContract: """Tests for DepsNamespace public API.""" - def test_namespace_has_add_method(self, tmp_path: Path) -> None: - """DepsNamespace has add(package) method. - - Breaks when: add method is missing. - """ - from py_code_mode.deps import DepsNamespace, FileDepsStore, PackageInstaller - - store = FileDepsStore(tmp_path) - installer = PackageInstaller() - namespace = DepsNamespace(store=store, installer=installer) - - assert hasattr(namespace, "add") - assert callable(namespace.add) - - def test_namespace_has_list_method(self, tmp_path: Path) -> None: - """DepsNamespace has list() method. - - Breaks when: list method is missing. 
- """ - from py_code_mode.deps import DepsNamespace, FileDepsStore, PackageInstaller - - store = FileDepsStore(tmp_path) - installer = PackageInstaller() - namespace = DepsNamespace(store=store, installer=installer) - - assert hasattr(namespace, "list") - assert callable(namespace.list) - - def test_namespace_has_remove_method(self, tmp_path: Path) -> None: - """DepsNamespace has remove(package) method. - - Breaks when: remove method is missing. - """ - from py_code_mode.deps import DepsNamespace, FileDepsStore, PackageInstaller - - store = FileDepsStore(tmp_path) - installer = PackageInstaller() - namespace = DepsNamespace(store=store, installer=installer) - - assert hasattr(namespace, "remove") - assert callable(namespace.remove) - - def test_namespace_has_sync_method(self, tmp_path: Path) -> None: - """DepsNamespace has sync() method. - - Breaks when: sync method is missing. - """ - from py_code_mode.deps import DepsNamespace, FileDepsStore, PackageInstaller - - store = FileDepsStore(tmp_path) - installer = PackageInstaller() - namespace = DepsNamespace(store=store, installer=installer) - - assert hasattr(namespace, "sync") - assert callable(namespace.sync) - def test_list_returns_list_of_strings(self, tmp_path: Path) -> None: """list() returns list[str]. diff --git a/tests/test_deps_store.py b/tests/test_deps_store.py index 412d35b..1275127 100644 --- a/tests/test_deps_store.py +++ b/tests/test_deps_store.py @@ -48,51 +48,6 @@ def test_redis_deps_store_is_deps_store(self, mock_redis: "MockRedisClient") -> store = RedisDepsStore(mock_redis, prefix="test") assert isinstance(store, DepsStore) - def test_protocol_requires_list_method(self) -> None: - """DepsStore protocol requires list() -> list[str]. - - Breaks when: Protocol doesn't define list method. - """ - from py_code_mode.deps import DepsStore - - assert hasattr(DepsStore, "list") - - def test_protocol_requires_add_method(self) -> None: - """DepsStore protocol requires add(package: str) -> None. - - Breaks when: Protocol doesn't define add method. - """ - from py_code_mode.deps import DepsStore - - assert hasattr(DepsStore, "add") - - def test_protocol_requires_remove_method(self) -> None: - """DepsStore protocol requires remove(package: str) -> bool. - - Breaks when: Protocol doesn't define remove method. - """ - from py_code_mode.deps import DepsStore - - assert hasattr(DepsStore, "remove") - - def test_protocol_requires_clear_method(self) -> None: - """DepsStore protocol requires clear() -> None. - - Breaks when: Protocol doesn't define clear method. - """ - from py_code_mode.deps import DepsStore - - assert hasattr(DepsStore, "clear") - - def test_protocol_requires_hash_method(self) -> None: - """DepsStore protocol requires hash() -> str. - - Breaks when: Protocol doesn't define hash method. - """ - from py_code_mode.deps import DepsStore - - assert hasattr(DepsStore, "hash") - # ============================================================================= # FileDepsStore Tests diff --git a/tests/test_error_handling.py b/tests/test_error_handling.py index c4f1f4c..8fa23cc 100644 --- a/tests/test_error_handling.py +++ b/tests/test_error_handling.py @@ -167,71 +167,43 @@ def hlen(self, key: str) -> int: class TestStorageExceptionHierarchy: - """Tests for new exception types that need to be added. 
- - These tests will FAIL until the exceptions are added to errors.py: - - StorageError (base) - - StorageReadError (read failures) - - StorageWriteError (write failures) - - ConfigurationError (invalid configuration) - """ + """Tests for storage/configuration exception hierarchy.""" def test_storage_error_exists(self): - """StorageError should be defined in errors module.""" - from py_code_mode import errors - - assert hasattr(errors, "StorageError"), ( - "StorageError not defined. Add to py_code_mode/errors.py:\n" - "class StorageError(CodeModeError):\n" - ' """Base class for storage-related errors."""\n' - " pass" - ) + """StorageError is defined and inherits from CodeModeError.""" + from py_code_mode.errors import StorageError + + assert issubclass(StorageError, CodeModeError) def test_storage_read_error_exists(self): """StorageReadError should be defined and inherit from StorageError.""" - from py_code_mode import errors + from py_code_mode.errors import StorageError, StorageReadError - assert hasattr(errors, "StorageReadError"), ( - "StorageReadError not defined. Add to py_code_mode/errors.py" - ) - # This will fail until both are defined - if hasattr(errors, "StorageError") and hasattr(errors, "StorageReadError"): - assert issubclass(errors.StorageReadError, errors.StorageError) + assert issubclass(StorageReadError, StorageError) def test_storage_write_error_exists(self): """StorageWriteError should be defined and inherit from StorageError.""" - from py_code_mode import errors + from py_code_mode.errors import StorageError, StorageWriteError - assert hasattr(errors, "StorageWriteError"), ( - "StorageWriteError not defined. Add to py_code_mode/errors.py" - ) - if hasattr(errors, "StorageError") and hasattr(errors, "StorageWriteError"): - assert issubclass(errors.StorageWriteError, errors.StorageError) + assert issubclass(StorageWriteError, StorageError) def test_configuration_error_exists(self): """ConfigurationError should be defined.""" - from py_code_mode import errors + from py_code_mode.errors import ConfigurationError - assert hasattr(errors, "ConfigurationError"), ( - "ConfigurationError not defined. 
Add to py_code_mode/errors.py" - ) - if hasattr(errors, "ConfigurationError"): - assert issubclass(errors.ConfigurationError, CodeModeError) + assert issubclass(ConfigurationError, CodeModeError) def test_storage_read_error_preserves_cause(self): """StorageReadError should preserve the original exception as __cause__.""" - from py_code_mode import errors - - if not hasattr(errors, "StorageReadError"): - pytest.skip("StorageReadError not yet implemented") + from py_code_mode.errors import StorageReadError original = ValueError("original error") try: try: raise original except ValueError as e: - raise errors.StorageReadError("read failed", path="/some/path") from e - except errors.StorageReadError as err: + raise StorageReadError("read failed", path="/some/path") from e + except StorageReadError as err: assert err.__cause__ is original assert "read failed" in str(err) assert hasattr(err, "path") or "/some/path" in str(err) @@ -446,28 +418,13 @@ def test_load_returns_none_for_missing_file(self, tmp_path: Path): assert result is None # Expected behavior - def test_load_raises_for_syntax_error( - self, workflows_dir_with_corruption: Path, log_capture: pytest.LogCaptureFixture - ): + def test_load_raises_for_syntax_error(self, workflows_dir_with_corruption: Path): """load() should raise StorageReadError for Python syntax errors.""" + from py_code_mode.errors import StorageReadError from py_code_mode.workflows import FileWorkflowStore store = FileWorkflowStore(workflows_dir_with_corruption) - - from py_code_mode import errors - - if not hasattr(errors, "StorageReadError"): - # Current behavior: returns None with warning - result = store.load("syntax_error") - if result is None: - # Check at least warning is logged (current behavior has this) - assert any("syntax_error" in record.message for record in log_capture.records), ( - "At minimum, a warning should be logged for syntax errors" - ) - pytest.skip("StorageReadError not yet implemented - upgrade test when added") - - # After fix: should raise StorageReadError - with pytest.raises(errors.StorageReadError): + with pytest.raises(StorageReadError): store.load("syntax_error") @@ -514,49 +471,22 @@ def test_load_returns_none_for_missing_key(self, mock_redis_with_corruption): assert result is None - def test_load_raises_for_invalid_json( - self, mock_redis_with_corruption, log_capture: pytest.LogCaptureFixture - ): + def test_load_raises_for_invalid_json(self, mock_redis_with_corruption): """load() should raise StorageReadError for invalid JSON.""" + from py_code_mode.errors import StorageReadError from py_code_mode.workflows import RedisWorkflowStore store = RedisWorkflowStore(mock_redis_with_corruption, prefix="workflows") - - from py_code_mode import errors - - if not hasattr(errors, "StorageReadError"): - # Current behavior: returns None with warning - result = store.load("corrupt_json") - if result is None: - # At least check warning is logged - assert any("corrupt_json" in record.message for record in log_capture.records), ( - "Warning should be logged for corrupt JSON" - ) - pytest.skip("StorageReadError not yet implemented") - - # After fix: should raise StorageReadError - with pytest.raises(errors.StorageReadError): + with pytest.raises(StorageReadError): store.load("corrupt_json") - def test_load_raises_for_missing_fields( - self, mock_redis_with_corruption, log_capture: pytest.LogCaptureFixture - ): + def test_load_raises_for_missing_fields(self, mock_redis_with_corruption): """load() should raise StorageReadError for incomplete workflow 
data.""" + from py_code_mode.errors import StorageReadError from py_code_mode.workflows import RedisWorkflowStore store = RedisWorkflowStore(mock_redis_with_corruption, prefix="workflows") - - from py_code_mode import errors - - if not hasattr(errors, "StorageReadError"): - result = store.load("missing_fields") - if result is None: - assert any("missing" in record.message.lower() for record in log_capture.records), ( - "Warning should be logged for missing fields" - ) - pytest.skip("StorageReadError not yet implemented") - - with pytest.raises(errors.StorageReadError): + with pytest.raises(StorageReadError): store.load("missing_fields") def test_list_all_logs_warning_for_corrupt_entries( diff --git a/tests/test_executor_configs.py b/tests/test_executor_configs.py index 0fc884f..1dd3c84 100644 --- a/tests/test_executor_configs.py +++ b/tests/test_executor_configs.py @@ -422,57 +422,7 @@ def test_to_docker_config_includes_deps_file(self, tmp_path: Path) -> None: assert str(deps_file.parent.absolute()) in docker_config["volumes"] -class TestAllConfigsHaveNewFields: - """Cross-cutting tests to ensure all configs have the new fields.""" - - def test_all_configs_have_tools_path(self) -> None: - """All executor configs have tools_path field. - - Contract: Consistent API across all executors. - Breaks when: Any config missing the field. - """ - from py_code_mode.execution import ContainerConfig, InProcessConfig, SubprocessConfig - - assert hasattr(InProcessConfig(), "tools_path") - assert hasattr(SubprocessConfig(), "tools_path") - assert hasattr(ContainerConfig(), "tools_path") - - def test_all_configs_have_deps(self) -> None: - """All executor configs have deps field. - - Contract: Consistent API across all executors. - Breaks when: Any config missing the field. - """ - from py_code_mode.execution import ContainerConfig, InProcessConfig, SubprocessConfig - - assert hasattr(InProcessConfig(), "deps") - assert hasattr(SubprocessConfig(), "deps") - assert hasattr(ContainerConfig(), "deps") - - def test_all_configs_have_deps_file(self) -> None: - """All executor configs have deps_file field. - - Contract: Consistent API across all executors. - Breaks when: Any config missing the field. - """ - from py_code_mode.execution import ContainerConfig, InProcessConfig, SubprocessConfig - - assert hasattr(InProcessConfig(), "deps_file") - assert hasattr(SubprocessConfig(), "deps_file") - assert hasattr(ContainerConfig(), "deps_file") - - def test_all_configs_have_ipc_timeout(self) -> None: - """All executor configs have ipc_timeout field. - - Contract: All configs support ipc_timeout. - Breaks when: Any config missing ipc_timeout. - Note: SubprocessConfig defaults to None (unlimited), others to 30.0. - """ - from py_code_mode.execution import ContainerConfig, InProcessConfig, SubprocessConfig - - assert hasattr(InProcessConfig(), "ipc_timeout") - assert hasattr(SubprocessConfig(), "ipc_timeout") - assert hasattr(ContainerConfig(), "ipc_timeout") - assert InProcessConfig().ipc_timeout == 30.0 - assert SubprocessConfig().ipc_timeout is None - assert ContainerConfig().ipc_timeout == 30.0 +# +# NOTE: Previously this file had "field presence" tests (mostly `hasattr(...)`) +# to enforce config consistency. Those were removed as low-value/performative: +# any real API break here should be caught by executor construction/start tests. 
diff --git a/tests/test_executor_deps_methods.py b/tests/test_executor_deps_methods.py index 05a1ed8..58d0a05 100644 --- a/tests/test_executor_deps_methods.py +++ b/tests/test_executor_deps_methods.py @@ -34,30 +34,6 @@ class TestInProcessExecutorInstallDepsContract: """Contract tests for InProcessExecutor.install_deps().""" - def test_executor_has_install_deps_method(self) -> None: - """InProcessExecutor has install_deps() method. - - Contract: Executor protocol requires install_deps(packages) method. - Breaks when: Method not implemented. - """ - from py_code_mode.execution.in_process import InProcessExecutor - - executor = InProcessExecutor() - assert hasattr(executor, "install_deps") - assert callable(executor.install_deps) - - def test_executor_has_uninstall_deps_method(self) -> None: - """InProcessExecutor has uninstall_deps() method. - - Contract: Executor protocol requires uninstall_deps(packages) method. - Breaks when: Method not implemented. - """ - from py_code_mode.execution.in_process import InProcessExecutor - - executor = InProcessExecutor() - assert hasattr(executor, "uninstall_deps") - assert callable(executor.uninstall_deps) - def test_executor_supports_deps_install_capability(self) -> None: """InProcessExecutor reports DEPS_INSTALL capability. @@ -482,22 +458,6 @@ class TestVenvManagerRemovePackage: should not run in parallel. """ - @pytest.mark.asyncio - async def test_remove_package_exists(self) -> None: - """VenvManager has remove_package() method. - - Contract: VenvManager.remove_package(venv, package) exists. - Breaks when: Method not implemented. - """ - from py_code_mode.execution.subprocess.config import SubprocessConfig - from py_code_mode.execution.subprocess.venv import VenvManager - - config = SubprocessConfig(python_version="3.12") - manager = VenvManager(config) - - assert hasattr(manager, "remove_package") - assert callable(manager.remove_package) - @pytest.mark.asyncio async def test_remove_package_uninstalls_from_venv(self, tmp_path: Path) -> None: """remove_package() uninstalls package from venv. @@ -582,30 +542,6 @@ async def test_remove_package_validates_package_spec(self, tmp_path: Path) -> No class TestSubprocessExecutorDepsMethodsContract: """Contract tests for SubprocessExecutor.install_deps() and uninstall_deps().""" - def test_executor_has_install_deps_method(self) -> None: - """SubprocessExecutor has install_deps() method. - - Contract: Executor protocol requires install_deps(packages) method. - Breaks when: Method not implemented. - """ - from py_code_mode.execution.subprocess import SubprocessExecutor - - executor = SubprocessExecutor() - assert hasattr(executor, "install_deps") - assert callable(executor.install_deps) - - def test_executor_has_uninstall_deps_method(self) -> None: - """SubprocessExecutor has uninstall_deps() method. - - Contract: Executor protocol requires uninstall_deps(packages) method. - Breaks when: Method not implemented. - """ - from py_code_mode.execution.subprocess import SubprocessExecutor - - executor = SubprocessExecutor() - assert hasattr(executor, "uninstall_deps") - assert callable(executor.uninstall_deps) - @pytest.mark.asyncio async def test_install_deps_returns_dict(self, tmp_path: Path) -> None: """install_deps() returns dict with expected keys. 
@@ -899,38 +835,6 @@ async def test_install_deps_handles_invalid_package_spec(self, tmp_path: Path) - # ============================================================================= -class TestDepsCapabilityConstants: - """Tests for DEPS_INSTALL and DEPS_UNINSTALL capability constants.""" - - def test_deps_install_capability_exists(self) -> None: - """DEPS_INSTALL capability constant exists. - - Contract: Capability.DEPS_INSTALL is defined. - Breaks when: Constant not added to Capability class. - """ - assert hasattr(Capability, "DEPS_INSTALL") - assert Capability.DEPS_INSTALL == "deps_install" - - def test_deps_uninstall_capability_exists(self) -> None: - """DEPS_UNINSTALL capability constant exists. - - Contract: Capability.DEPS_UNINSTALL is defined. - Breaks when: Constant not added to Capability class. - """ - assert hasattr(Capability, "DEPS_UNINSTALL") - assert Capability.DEPS_UNINSTALL == "deps_uninstall" - - def test_deps_capabilities_in_all_set(self) -> None: - """DEPS_INSTALL and DEPS_UNINSTALL in Capability.all() set. - - Contract: All capabilities returned by Capability.all(). - Breaks when: New capabilities not added to all() method. - """ - all_caps = Capability.all() - assert Capability.DEPS_INSTALL in all_caps - assert Capability.DEPS_UNINSTALL in all_caps - - # ============================================================================= # Session + Executor Integration Tests # ============================================================================= diff --git a/tests/test_executor_protocol.py b/tests/test_executor_protocol.py index 7d1fde8..4e6cb5e 100644 --- a/tests/test_executor_protocol.py +++ b/tests/test_executor_protocol.py @@ -1,86 +1,14 @@ -"""Tests for Executor protocol changes - Step 5 of implementation plan. +"""Executor/storage integration tests. -These tests verify: -1. Executor protocol defines start() method -2. All executors accept StorageBackend | None (not StorageAccess) -3. StorageBackendAccess class is deleted -4. Each executor correctly handles StorageBackend - -Written to FAIL initially (TDD RED phase). +These focus on behavior at the executor<->storage boundary, not protocol/shape +introspection (which is brittle and mostly redundant with behavioral tests). 
""" from pathlib import Path -from typing import get_type_hints from unittest.mock import AsyncMock, MagicMock, patch import pytest -# ============================================================================= -# Protocol Compliance Tests -# ============================================================================= - - -class TestExecutorProtocolDefinesStart: - """Verify the Executor protocol includes start() method.""" - - def test_protocol_has_start_method(self) -> None: - """Executor protocol must define start() method.""" - from py_code_mode.execution.protocol import Executor - - # Protocol should have start method - assert hasattr(Executor, "start"), "Executor protocol must define start() method" - - def test_protocol_start_accepts_storage_backend(self) -> None: - """Executor.start() must accept StorageBackend | None parameter.""" - from py_code_mode.execution.protocol import Executor - from py_code_mode.storage.backends import StorageBackend - - # Get type hints for start method, providing StorageBackend for forward reference - hints = get_type_hints(Executor.start, globalns={"StorageBackend": StorageBackend}) - - # Should have 'storage' parameter that accepts StorageBackend | None - assert "storage" in hints, "start() must have 'storage' parameter" - - # Check the type annotation includes StorageBackend - storage_type = hints["storage"] - # Handle Union types (StorageBackend | None) - storage_type_str = str(storage_type) - assert "StorageBackend" in storage_type_str, ( - f"start() storage parameter must accept StorageBackend, got {storage_type_str}" - ) - - def test_protocol_start_is_async(self) -> None: - """Executor.start() must be an async method.""" - import asyncio - - from py_code_mode.execution.protocol import Executor - - # start method should be a coroutine function - assert asyncio.iscoroutinefunction(Executor.start), "Executor.start() must be async" - - -class TestStorageBackendAccessDeleted: - """Verify StorageBackendAccess class is removed.""" - - def test_storage_backend_access_not_in_protocol(self) -> None: - """StorageBackendAccess should not exist in protocol module.""" - from py_code_mode.execution import protocol - - assert not hasattr(protocol, "StorageBackendAccess"), ( - "StorageBackendAccess should be deleted from protocol.py" - ) - - def test_storage_access_union_excludes_backend_access(self) -> None: - """StorageAccess type should not include StorageBackendAccess.""" - from py_code_mode.execution.protocol import StorageAccess - - # StorageAccess should only be FileStorageAccess | RedisStorageAccess - storage_access_str = str(StorageAccess) - assert "StorageBackendAccess" not in storage_access_str, ( - f"StorageAccess should not include StorageBackendAccess: {storage_access_str}" - ) - - # ============================================================================= # InProcessExecutor Tests # ============================================================================= @@ -89,36 +17,6 @@ def test_storage_access_union_excludes_backend_access(self) -> None: class TestInProcessExecutorAcceptsStorageBackend: """InProcessExecutor.start() must accept StorageBackend directly.""" - def test_start_accepts_storage_backend(self, tmp_path: Path) -> None: - """InProcessExecutor.start() accepts StorageBackend parameter.""" - from py_code_mode.execution.in_process import InProcessExecutor - from py_code_mode.storage.backends import FileStorage - - storage = FileStorage(tmp_path) - executor = InProcessExecutor() - - # This should NOT raise - executor accepts 
StorageBackend - # Type checker would fail if signature is still StorageAccess - import asyncio - - asyncio.run(executor.start(storage=storage)) - - def test_start_parameter_named_storage_not_storage_access(self) -> None: - """InProcessExecutor.start() parameter must be named 'storage' not 'storage_access'.""" - import inspect - - from py_code_mode.execution.in_process import InProcessExecutor - - sig = inspect.signature(InProcessExecutor.start) - param_names = list(sig.parameters.keys()) - - assert "storage" in param_names, ( - f"start() must have 'storage' parameter, got: {param_names}" - ) - assert "storage_access" not in param_names, ( - "start() should NOT have 'storage_access' parameter (old name)" - ) - @pytest.mark.asyncio async def test_uses_executor_config_for_tools(self, tmp_path: Path) -> None: """InProcessExecutor uses config.tools_path for tools. @@ -266,22 +164,6 @@ async def test_rejects_redis_storage_access(self) -> None: class TestContainerExecutorAcceptsStorageBackend: """ContainerExecutor.start() must accept StorageBackend directly.""" - def test_start_parameter_named_storage(self) -> None: - """ContainerExecutor.start() parameter must be named 'storage'.""" - import inspect - - from py_code_mode.execution.container import ContainerExecutor - - sig = inspect.signature(ContainerExecutor.start) - param_names = list(sig.parameters.keys()) - - assert "storage" in param_names, ( - f"start() must have 'storage' parameter, got: {param_names}" - ) - assert "storage_access" not in param_names, ( - "start() should NOT have 'storage_access' parameter (old name)" - ) - @pytest.mark.asyncio async def test_calls_get_serializable_access_for_file_storage(self, tmp_path: Path) -> None: """ContainerExecutor calls storage.get_serializable_access() for FileStorage.""" @@ -408,22 +290,6 @@ async def test_rejects_file_storage_access(self, tmp_path: Path) -> None: class TestSubprocessExecutorAcceptsStorageBackend: """SubprocessExecutor.start() must accept StorageBackend directly.""" - def test_start_parameter_named_storage(self) -> None: - """SubprocessExecutor.start() parameter must be named 'storage'.""" - import inspect - - from py_code_mode.execution.subprocess import SubprocessExecutor - - sig = inspect.signature(SubprocessExecutor.start) - param_names = list(sig.parameters.keys()) - - assert "storage" in param_names, ( - f"start() must have 'storage' parameter, got: {param_names}" - ) - assert "storage_access" not in param_names, ( - "start() should NOT have 'storage_access' parameter (old name)" - ) - @pytest.mark.asyncio async def test_calls_get_serializable_access(self, tmp_path: Path) -> None: """SubprocessExecutor calls storage.get_serializable_access(). 
@@ -513,50 +379,3 @@ async def test_rejects_file_storage_access(self, tmp_path: Path) -> None: # ============================================================================= # Cross-Executor Consistency Tests # ============================================================================= - - -class TestAllExecutorsHaveConsistentStartSignature: - """All executors must have identical start() signatures.""" - - def test_all_executors_have_storage_parameter(self) -> None: - """All executor start() methods have 'storage' parameter.""" - import inspect - - from py_code_mode.execution.container import ContainerExecutor - from py_code_mode.execution.in_process import InProcessExecutor - from py_code_mode.execution.subprocess import SubprocessExecutor - - executors = [ - ("InProcessExecutor", InProcessExecutor), - ("ContainerExecutor", ContainerExecutor), - ("SubprocessExecutor", SubprocessExecutor), - ] - - for name, executor_cls in executors: - sig = inspect.signature(executor_cls.start) - param_names = list(sig.parameters.keys()) - assert "storage" in param_names, ( - f"{name}.start() must have 'storage' parameter, got: {param_names}" - ) - - def test_all_executors_storage_defaults_to_none(self) -> None: - """All executor start() methods have storage default to None.""" - import inspect - - from py_code_mode.execution.container import ContainerExecutor - from py_code_mode.execution.in_process import InProcessExecutor - from py_code_mode.execution.subprocess import SubprocessExecutor - - executors = [ - ("InProcessExecutor", InProcessExecutor), - ("ContainerExecutor", ContainerExecutor), - ("SubprocessExecutor", SubprocessExecutor), - ] - - for name, executor_cls in executors: - sig = inspect.signature(executor_cls.start) - storage_param = sig.parameters.get("storage") - assert storage_param is not None, f"{name}.start() missing storage parameter" - assert storage_param.default is None, ( - f"{name}.start() storage must default to None, got: {storage_param.default}" - ) diff --git a/tests/test_mcp_adapter.py b/tests/test_mcp_adapter.py index 46f1827..da27bdb 100644 --- a/tests/test_mcp_adapter.py +++ b/tests/test_mcp_adapter.py @@ -195,23 +195,6 @@ async def test_call_tool_handles_error_response(self, adapter, mock_session) -> class TestMCPAdapterConnection: """Tests for MCP server connection management.""" - @pytest.mark.asyncio - async def test_connect_to_stdio_server(self) -> None: - """Can connect to MCP server via stdio.""" - from py_code_mode.tools.adapters.mcp import MCPAdapter - - # This test verifies the factory method exists - # Actual connection would require a real server - assert hasattr(MCPAdapter, "connect_stdio") - - @pytest.mark.asyncio - async def test_connect_to_sse_server(self) -> None: - """Can connect to MCP server via SSE transport.""" - from py_code_mode.tools.adapters.mcp import MCPAdapter - - # This test verifies the factory method exists - assert hasattr(MCPAdapter, "connect_sse") - @pytest.mark.asyncio async def test_close_cleans_up(self) -> None: """close() cleans up resources.""" @@ -317,14 +300,6 @@ async def test_connect_sse_initializes_session(self) -> None: mock_session.initialize.assert_called_once() - @pytest.mark.asyncio - async def test_connect_sse_method_exists(self) -> None: - """connect_sse method exists on MCPAdapter.""" - from py_code_mode.tools.adapters.mcp import MCPAdapter - - assert hasattr(MCPAdapter, "connect_sse") - assert callable(MCPAdapter.connect_sse) - class TestMCPAdapterNamespacing: """Tests for MCP tool namespacing - tools grouped under 
namespace like CLI tools.""" diff --git a/tests/test_namespace.py b/tests/test_namespace.py index 78f7b96..23186d0 100644 --- a/tests/test_namespace.py +++ b/tests/test_namespace.py @@ -93,7 +93,7 @@ async def communicate(self): monkeypatch.setattr(asyncio, "create_subprocess_exec", mock_create_subprocess_exec) - result = await namespace.nmap.syn_scan(target="10.0.0.1") + result = namespace.nmap.syn_scan(target="10.0.0.1") assert result == "Mock nmap output" diff --git a/tests/test_rpc_errors.py b/tests/test_rpc_errors.py index 97a1918..c302d62 100644 --- a/tests/test_rpc_errors.py +++ b/tests/test_rpc_errors.py @@ -312,7 +312,7 @@ async def test_workflow_error_is_namespace_error(self, executor_with_storage) -> result = await executor_with_storage.run("issubclass(WorkflowError, NamespaceError)") assert result.error is None - assert result.value in (True, "True") + assert result.value is True @pytest.mark.asyncio async def test_tool_error_is_namespace_error(self, executor_with_storage) -> None: @@ -323,7 +323,7 @@ async def test_tool_error_is_namespace_error(self, executor_with_storage) -> Non result = await executor_with_storage.run("issubclass(ToolError, NamespaceError)") assert result.error is None - assert result.value in (True, "True") + assert result.value is True @pytest.mark.asyncio async def test_artifact_error_is_namespace_error(self, executor_with_storage) -> None: @@ -334,7 +334,7 @@ async def test_artifact_error_is_namespace_error(self, executor_with_storage) -> result = await executor_with_storage.run("issubclass(ArtifactError, NamespaceError)") assert result.error is None - assert result.value in (True, "True") + assert result.value is True @pytest.mark.asyncio async def test_deps_error_is_namespace_error(self, executor_with_storage) -> None: @@ -345,7 +345,7 @@ async def test_deps_error_is_namespace_error(self, executor_with_storage) -> Non result = await executor_with_storage.run("issubclass(DepsError, NamespaceError)") assert result.error is None - assert result.value in (True, "True") + assert result.value is True @pytest.mark.asyncio async def test_namespace_error_is_rpc_error(self, executor_with_storage) -> None: @@ -356,7 +356,7 @@ async def test_namespace_error_is_rpc_error(self, executor_with_storage) -> None result = await executor_with_storage.run("issubclass(NamespaceError, RPCError)") assert result.error is None - assert result.value in (True, "True") + assert result.value is True @pytest.mark.asyncio async def test_rpc_error_is_exception(self, executor_with_storage) -> None: @@ -367,7 +367,7 @@ async def test_rpc_error_is_exception(self, executor_with_storage) -> None: result = await executor_with_storage.run("issubclass(RPCError, Exception)") assert result.error is None - assert result.value in (True, "True") + assert result.value is True # ============================================================================= @@ -451,7 +451,7 @@ async def test_rpc_transport_error_is_rpc_error(self, executor_with_storage) -> result = await executor_with_storage.run("issubclass(RPCTransportError, RPCError)") assert result.error is None - assert result.value in (True, "True") + assert result.value is True @pytest.mark.asyncio async def test_non_dict_error_raises_rpc_transport_error(self, executor_with_storage) -> None: diff --git a/tests/test_semantic.py b/tests/test_semantic.py index f59e82d..e62f0fb 100644 --- a/tests/test_semantic.py +++ b/tests/test_semantic.py @@ -16,19 +16,6 @@ def _make_workflow(name: str, description: str, code: str) -> PythonWorkflow: class 
TestEmbeddingProviderProtocol: """Tests that define the EmbeddingProvider interface.""" - def test_provider_has_embed_method(self) -> None: - """Provider must have embed() that returns vectors.""" - from py_code_mode.workflows import EmbeddingProvider - - # Protocol should define embed method - assert hasattr(EmbeddingProvider, "embed") - - def test_provider_has_dimension_property(self) -> None: - """Provider exposes embedding dimension for index allocation.""" - from py_code_mode.workflows import EmbeddingProvider - - assert hasattr(EmbeddingProvider, "dimension") - def test_embed_returns_list_of_vectors(self) -> None: """embed() takes list of strings, returns list of float vectors.""" from py_code_mode.workflows import MockEmbedder @@ -93,8 +80,6 @@ def test_batch_embedding(self, embedder) -> None: def test_detects_device(self, embedder) -> None: """Uses MPS on Apple Silicon, CUDA if available, else CPU.""" - # Just verify it has a device attribute - assert hasattr(embedder, "device") assert embedder.device in ("mps", "cuda", "cpu") diff --git a/tests/test_session.py b/tests/test_session.py index c10c417..d024450 100644 --- a/tests/test_session.py +++ b/tests/test_session.py @@ -98,14 +98,14 @@ def storage(self, tmp_path: Path) -> FileStorage: @pytest.mark.asyncio async def test_run_returns_execution_result(self, storage: FileStorage) -> None: - """run() returns an ExecutionResult.""" + """run() returns an ExecutionResult. + + Covered by tests that assert specific `ExecutionResult` behavior (value/stdout/error). + """ async with Session(storage=storage) as session: result = await session.run("42") - - assert hasattr(result, "is_ok") - assert hasattr(result, "value") - assert hasattr(result, "error") - assert hasattr(result, "stdout") + assert result.error is None + assert result.value == 42 @pytest.mark.asyncio async def test_run_evaluates_expression(self, storage: FileStorage) -> None: @@ -435,81 +435,16 @@ def storage(self, tmp_path: Path) -> FileStorage: async def test_session_supports_method(self, storage: FileStorage) -> None: """Session has supports() method for capability queries.""" async with Session(storage=storage) as session: - # Should have this method - assert hasattr(session, "supports") - assert callable(session.supports) + # Calls through to the active executor. + assert isinstance(session.supports("timeout"), bool) @pytest.mark.asyncio async def test_session_supported_capabilities(self, storage: FileStorage) -> None: """Session has supported_capabilities() method.""" async with Session(storage=storage) as session: - assert hasattr(session, "supported_capabilities") caps = session.supported_capabilities() assert isinstance(caps, set) - - -# ============================================================================= -# StorageAccess Type Tests -# ============================================================================= - - -class TestStorageAccessTypes: - """Tests for StorageAccess type definitions.""" - - def test_file_storage_access_exists(self) -> None: - """FileStorageAccess type is importable.""" - from py_code_mode.execution.protocol import FileStorageAccess - - assert FileStorageAccess is not None - - def test_redis_storage_access_exists(self) -> None: - """RedisStorageAccess type is importable.""" - from py_code_mode.execution.protocol import RedisStorageAccess - - assert RedisStorageAccess is not None - - def test_file_storage_access_has_paths(self) -> None: - """FileStorageAccess has workflows_path, artifacts_path. 
- - NOTE: tools_path and deps_path removed - tools/deps now owned by executors. - """ - from py_code_mode.execution.protocol import FileStorageAccess - - access = FileStorageAccess( - workflows_path=Path("/tmp/workflows"), - artifacts_path=Path("/tmp/artifacts"), - ) - assert access.workflows_path == Path("/tmp/workflows") - assert access.artifacts_path == Path("/tmp/artifacts") - - def test_file_storage_access_paths_optional(self) -> None: - """FileStorageAccess allows None for workflows_path. - - NOTE: tools_path and deps_path removed - tools/deps now owned by executors. - """ - from py_code_mode.execution.protocol import FileStorageAccess - - access = FileStorageAccess( - workflows_path=None, - artifacts_path=Path("/tmp/artifacts"), - ) - assert access.workflows_path is None - - def test_redis_storage_access_has_url_and_prefixes(self) -> None: - """RedisStorageAccess has redis_url and prefix fields. - - NOTE: tools_prefix and deps_prefix removed - tools/deps now owned by executors. - """ - from py_code_mode.execution.protocol import RedisStorageAccess - - access = RedisStorageAccess( - redis_url="redis://localhost:6379", - workflows_prefix="app:workflows", - artifacts_prefix="app:artifacts", - ) - assert access.redis_url == "redis://localhost:6379" - assert access.workflows_prefix == "app:workflows" - assert access.artifacts_prefix == "app:artifacts" + assert "timeout" in caps # ============================================================================= @@ -931,17 +866,17 @@ async def run(a: int, b: int) -> int: # Verify tools namespace exists result = await session.run("'tools' in dir()") assert result.is_ok, f"Failed to check tools: {result.error}" - assert result.value in (True, "True"), "tools namespace not found" + assert result.value is True, "tools namespace not found" # Verify workflows namespace exists result = await session.run("'workflows' in dir()") assert result.is_ok, f"Failed to check workflows: {result.error}" - assert result.value in (True, "True"), "workflows namespace not found" + assert result.value is True, "workflows namespace not found" # Verify artifacts namespace exists result = await session.run("'artifacts' in dir()") assert result.is_ok, f"Failed to check artifacts: {result.error}" - assert result.value in (True, "True"), "artifacts namespace not found" + assert result.value is True, "artifacts namespace not found" # Verify workflows.list() works and contains our workflow result = await session.run("workflows.list()") @@ -1038,6 +973,6 @@ async def test_process_isolation_implies_serializable_access(self, tmp_path: Pat # the subprocess won't be able to reconstruct the storage result = await session.run("'artifacts' in dir()") assert result.is_ok, f"Failed: {result.error}" - assert result.value in (True, "True"), ( + assert result.value is True, ( "artifacts namespace not available - serializable access likely broken" ) diff --git a/tests/test_skill_library_vector_store.py b/tests/test_skill_library_vector_store.py index 2222c1b..50b96f8 100644 --- a/tests/test_skill_library_vector_store.py +++ b/tests/test_skill_library_vector_store.py @@ -595,19 +595,6 @@ def test_mock_vector_store_implements_protocol(self) -> None: # Should pass isinstance check assert isinstance(mock, VectorStore) - def test_mock_vector_store_has_all_required_methods(self) -> None: - """Verify MockVectorStore has all VectorStore methods.""" - mock = MockVectorStore() - - # All protocol methods should exist - assert hasattr(mock, "add") - assert hasattr(mock, "remove") - assert 
hasattr(mock, "search") - assert hasattr(mock, "get_content_hash") - assert hasattr(mock, "get_model_info") - assert hasattr(mock, "clear") - assert hasattr(mock, "count") - class TestWarmStartupCaching: """Test that vector_store caching works across library instances.""" diff --git a/tests/test_skill_store.py b/tests/test_skill_store.py index 798fb6a..b9f7426 100644 --- a/tests/test_skill_store.py +++ b/tests/test_skill_store.py @@ -286,9 +286,10 @@ def test_save_and_load_python_workflow( assert loaded is not None assert loaded.name == "greet" assert loaded.description == "Greet someone" - # Stored workflows have source and can invoke - duck typing - assert hasattr(loaded, "source") - assert hasattr(loaded, "invoke") + # Stored workflows have source and can invoke. + assert isinstance(loaded.source, str) + assert loaded.source + assert callable(loaded.invoke) def test_load_nonexistent_returns_none(self, redis_store: RedisWorkflowStore): """Should return None for nonexistent workflow.""" diff --git a/tests/test_storage.py b/tests/test_storage.py index ffefa41..663a022 100644 --- a/tests/test_storage.py +++ b/tests/test_storage.py @@ -263,8 +263,8 @@ def test_method_exists_on_file_storage(self, tmp_path: Path) -> None: """ storage = FileStorage(tmp_path) - assert hasattr(storage, "get_serializable_access") - assert callable(storage.get_serializable_access) + # Covered by tests that call get_serializable_access() and assert return types. + assert storage.get_serializable_access() is not None def test_method_exists_on_redis_storage(self, mock_redis: MockRedisClient) -> None: """RedisStorage has get_serializable_access method. @@ -273,8 +273,7 @@ def test_method_exists_on_redis_storage(self, mock_redis: MockRedisClient) -> No """ storage = RedisStorage(redis=mock_redis, prefix="test") - assert hasattr(storage, "get_serializable_access") - assert callable(storage.get_serializable_access) + assert storage.get_serializable_access() is not None # NOTE: TestStorageBackendExecutionMethods was removed in the executor-ownership refactor. diff --git a/tests/test_storage_vector_store.py b/tests/test_storage_vector_store.py index af93e0e..5f34200 100644 --- a/tests/test_storage_vector_store.py +++ b/tests/test_storage_vector_store.py @@ -35,15 +35,6 @@ class TestFileStorageVectorStoreIntegration: """Tests for FileStorage vector store integration.""" - def test_get_vector_store_method_exists(self, tmp_path: Path) -> None: - """FileStorage has get_vector_store() method. - - Breaks when: Method doesn't exist on FileStorage. - """ - storage = FileStorage(tmp_path) - assert hasattr(storage, "get_vector_store") - assert callable(storage.get_vector_store) - def test_get_vector_store_returns_chroma_when_available(self, tmp_path: Path) -> None: """get_vector_store() returns ChromaVectorStore when chromadb installed. @@ -55,11 +46,10 @@ def test_get_vector_store_returns_chroma_when_available(self, tmp_path: Path) -> # Should return ChromaVectorStore if chromadb available assert vector_store is not None - # Check it has VectorStore protocol methods - assert hasattr(vector_store, "add") - assert hasattr(vector_store, "remove") - assert hasattr(vector_store, "search") - assert hasattr(vector_store, "count") + # Runtime-checkable protocol: ensure it satisfies VectorStore. + from py_code_mode.workflows.vector_store import VectorStore + + assert isinstance(vector_store, VectorStore) def test_get_vector_store_uses_correct_path(self, tmp_path: Path) -> None: """get_vector_store() uses {base_path}/vectors/ directory. 
@@ -114,18 +104,6 @@ def test_get_vector_store_creates_embedder(self, tmp_path: Path) -> None: class TestFileStorageWorkflowLibraryVectorStoreIntegration: """Tests for WorkflowLibrary receiving vector_store from FileStorage.""" - def test_workflow_library_has_vector_store_attribute(self, tmp_path: Path) -> None: - """WorkflowLibrary created by FileStorage has vector_store attribute. - - Breaks when: create_workflow_library() not called with vector_store parameter. - """ - storage = FileStorage(tmp_path) - - library = storage.get_workflow_library() - - # Should have vector_store attribute - assert hasattr(library, "vector_store") - def test_workflow_library_vector_store_matches_get_vector_store(self, tmp_path: Path) -> None: """WorkflowLibrary.vector_store is same instance as storage.get_vector_store(). @@ -173,15 +151,6 @@ def test_workflow_library_uses_vector_store_for_search(self, tmp_path: Path) -> class TestRedisStorageVectorStorePlaceholder: """Tests for RedisStorage vector store integration (Phase 6 placeholder).""" - def test_get_vector_store_method_exists(self, mock_redis: MockRedisClient) -> None: - """RedisStorage has get_vector_store() method. - - Breaks when: Method doesn't exist on RedisStorage. - """ - storage = RedisStorage(redis=mock_redis, prefix="test") - assert hasattr(storage, "get_vector_store") - assert callable(storage.get_vector_store) - def test_get_vector_store_returns_none_for_now(self, mock_redis: MockRedisClient) -> None: """get_vector_store() returns None (RedisVectorStore not implemented yet). @@ -204,15 +173,13 @@ class TestFileStorageAccessVectorsPath: """Tests for vectors_path field in FileStorageAccess.""" def test_file_storage_access_has_vectors_path_field(self, tmp_path: Path) -> None: - """FileStorageAccess has vectors_path field. - - Breaks when: Field doesn't exist in dataclass definition. - """ + """FileStorageAccess has vectors_path field (cross-process config).""" storage = FileStorage(tmp_path) access = storage.get_serializable_access() - assert hasattr(access, "vectors_path") + # Attribute access is the behavior: this will raise AttributeError if missing. + _ = access.vectors_path def test_vectors_path_is_optional(self, tmp_path: Path) -> None: """vectors_path can be None when vector store unavailable. @@ -225,8 +192,7 @@ def test_vectors_path_is_optional(self, tmp_path: Path) -> None: with patch.object(storage, "get_vector_store", return_value=None): access = storage.get_serializable_access() - # Should be None when vector store not available - # (or set to path if chromadb is available) + # Should be None when vector store not available (or set to a Path if available). assert access.vectors_path is None or isinstance(access.vectors_path, Path) def test_vectors_path_points_to_vectors_directory(self, tmp_path: Path) -> None: @@ -266,15 +232,12 @@ class TestRedisStorageAccessVectorsPrefixPlaceholder: def test_redis_storage_access_has_vectors_prefix_field( self, mock_redis: MockRedisClient ) -> None: - """RedisStorageAccess has vectors_prefix field. - - Breaks when: Field doesn't exist in dataclass definition. - """ + """RedisStorageAccess has vectors_prefix field (placeholder for Phase 6).""" storage = RedisStorage(redis=mock_redis, prefix="test") access = storage.get_serializable_access() - assert hasattr(access, "vectors_prefix") + _ = access.vectors_prefix def test_vectors_prefix_is_optional(self, mock_redis: MockRedisClient) -> None: """vectors_prefix can be None when RedisVectorStore not implemented. 
@@ -285,7 +248,7 @@ def test_vectors_prefix_is_optional(self, mock_redis: MockRedisClient) -> None: access = storage.get_serializable_access() - # Should be None until Phase 6 implements RedisVectorStore + # Should be None until Phase 6 implements RedisVectorStore. assert access.vectors_prefix is None or isinstance(access.vectors_prefix, str) def test_vectors_prefix_follows_pattern_when_implemented( diff --git a/tests/test_storage_wrapper_cleanup.py b/tests/test_storage_wrapper_cleanup.py index e327995..39e4259 100644 --- a/tests/test_storage_wrapper_cleanup.py +++ b/tests/test_storage_wrapper_cleanup.py @@ -256,33 +256,6 @@ class TestStorageBackendProtocolSimplified: # NOTE: test_storage_backend_has_get_tool_registry removed # tools are now owned by executors, not storage - def test_storage_backend_has_get_workflow_library(self) -> None: - """StorageBackend protocol must have get_workflow_library method. - - Breaks when: Method is missing from protocol. - """ - from py_code_mode.storage.backends import StorageBackend - - assert hasattr(StorageBackend, "get_workflow_library") - - def test_storage_backend_has_get_artifact_store(self) -> None: - """StorageBackend protocol must have get_artifact_store method. - - Breaks when: Method is missing from protocol. - """ - from py_code_mode.storage.backends import StorageBackend - - assert hasattr(StorageBackend, "get_artifact_store") - - def test_storage_backend_has_get_serializable_access(self) -> None: - """StorageBackend protocol must have get_serializable_access method. - - Breaks when: Method is missing from protocol. - """ - from py_code_mode.storage.backends import StorageBackend - - assert hasattr(StorageBackend, "get_serializable_access") - def test_storage_backend_no_tools_property(self) -> None: """StorageBackend protocol must NOT have tools property. 
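Several of the deletions above (here and in test_storage_vector_store.py / test_skill_library_vector_store.py) lean on the VectorStore protocol being runtime-checkable, so one isinstance() check replaces a pile of per-method hasattr() assertions. The toy below is a self-contained illustration of that mechanism only; the names are invented and it is not the library's real VectorStore definition. Note that isinstance() against a runtime-checkable Protocol verifies member presence, not signatures or behavior, which is why the remaining tests still exercise add/search/count directly.

    # Hedged, self-contained illustration with toy names.
    from typing import Protocol, runtime_checkable


    @runtime_checkable
    class SupportsSearch(Protocol):
        def add(self, key: str, text: str) -> None: ...
        def search(self, query: str, k: int = 5) -> list[str]: ...


    class InMemoryIndex:
        def __init__(self) -> None:
            self._items: dict[str, str] = {}

        def add(self, key: str, text: str) -> None:
            self._items[key] = text

        def search(self, query: str, k: int = 5) -> list[str]:
            return [key for key, text in self._items.items() if query in text][:k]


    # Structural check: no inheritance from SupportsSearch is needed.
    assert isinstance(InMemoryIndex(), SupportsSearch)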
diff --git a/tests/test_subprocess_executor.py b/tests/test_subprocess_executor.py index bcbf47d..492176b 100644 --- a/tests/test_subprocess_executor.py +++ b/tests/test_subprocess_executor.py @@ -8,7 +8,7 @@ from py_code_mode.execution.protocol import Capability from py_code_mode.execution.subprocess.config import SubprocessConfig -from py_code_mode.execution.subprocess.venv import KernelVenv, VenvManager +from py_code_mode.execution.subprocess.venv import VenvManager class TestSubprocessConfig: @@ -214,76 +214,6 @@ def test_valid_python_version_3_10(self) -> None: # ============================================================================= -class TestKernelVenv: - """Tests for KernelVenv dataclass structure.""" - - # ========================================================================= - # Field Existence - # ========================================================================= - - def test_has_path_field(self, tmp_path: Path) -> None: - """KernelVenv has path field.""" - venv = KernelVenv( - path=tmp_path / "venv", - python_path=tmp_path / "venv" / "bin" / "python", - kernel_spec_name="test-kernel", - ) - assert hasattr(venv, "path") - assert venv.path == tmp_path / "venv" - - def test_has_python_path_field(self, tmp_path: Path) -> None: - """KernelVenv has python_path field.""" - python_path = tmp_path / "venv" / "bin" / "python" - venv = KernelVenv( - path=tmp_path / "venv", - python_path=python_path, - kernel_spec_name="test-kernel", - ) - assert hasattr(venv, "python_path") - assert venv.python_path == python_path - - def test_has_kernel_spec_name_field(self, tmp_path: Path) -> None: - """KernelVenv has kernel_spec_name field.""" - venv = KernelVenv( - path=tmp_path / "venv", - python_path=tmp_path / "venv" / "bin" / "python", - kernel_spec_name="my-kernel-spec", - ) - assert hasattr(venv, "kernel_spec_name") - assert venv.kernel_spec_name == "my-kernel-spec" - - # ========================================================================= - # Type Correctness - # ========================================================================= - - def test_path_is_path_type(self, tmp_path: Path) -> None: - """path field is Path type.""" - venv = KernelVenv( - path=tmp_path / "venv", - python_path=tmp_path / "venv" / "bin" / "python", - kernel_spec_name="test-kernel", - ) - assert isinstance(venv.path, Path) - - def test_python_path_is_path_type(self, tmp_path: Path) -> None: - """python_path field is Path type.""" - venv = KernelVenv( - path=tmp_path / "venv", - python_path=tmp_path / "venv" / "bin" / "python", - kernel_spec_name="test-kernel", - ) - assert isinstance(venv.python_path, Path) - - def test_kernel_spec_name_is_str_type(self, tmp_path: Path) -> None: - """kernel_spec_name field is str type.""" - venv = KernelVenv( - path=tmp_path / "venv", - python_path=tmp_path / "venv" / "bin" / "python", - kernel_spec_name="test-kernel", - ) - assert isinstance(venv.kernel_spec_name, str) - - # ============================================================================= # VenvManager Initialization Tests # ============================================================================= @@ -1095,13 +1025,13 @@ async def test_start_with_storage_injects_namespaces(self, tmp_path: Path) -> No # Verify namespaces are injected result = await executor.run("'tools' in dir()") - assert result.value in (True, "True") + assert result.value is True result = await executor.run("'workflows' in dir()") - assert result.value in (True, "True") + assert result.value is True result = await 
executor.run("'artifacts' in dir()") - assert result.value in (True, "True") + assert result.value is True finally: await executor.close() @@ -1566,19 +1496,19 @@ async def test_reset_preserves_injected_namespaces(self, executor) -> None: """reset() preserves tools, workflows, artifacts namespaces.""" # Verify namespaces exist before reset result = await executor.run("'tools' in dir()") - assert result.value in (True, "True") + assert result.value is True await executor.reset() # Namespaces should still exist after reset result = await executor.run("'tools' in dir()") - assert result.value in (True, "True") + assert result.value is True result = await executor.run("'workflows' in dir()") - assert result.value in (True, "True") + assert result.value is True result = await executor.run("'artifacts' in dir()") - assert result.value in (True, "True") + assert result.value is True # ============================================================================= @@ -1736,7 +1666,7 @@ async def test_deps_namespace_is_available(self, executor_with_storage) -> None: result = await executor_with_storage.run("'deps' in dir()") assert result.error is None - assert result.value in (True, "True") + assert result.value is True @pytest.mark.asyncio async def test_deps_list_returns_list(self, executor_with_storage) -> None: @@ -1761,7 +1691,7 @@ async def test_deps_has_add_method(self, executor_with_storage) -> None: result = await executor_with_storage.run("callable(deps.add)") assert result.error is None - assert result.value in (True, "True") + assert result.value is True @pytest.mark.asyncio async def test_deps_has_remove_method(self, executor_with_storage) -> None: @@ -1773,7 +1703,7 @@ async def test_deps_has_remove_method(self, executor_with_storage) -> None: result = await executor_with_storage.run("callable(deps.remove)") assert result.error is None - assert result.value in (True, "True") + assert result.value is True @pytest.mark.asyncio async def test_deps_has_sync_method(self, executor_with_storage) -> None: @@ -1785,7 +1715,7 @@ async def test_deps_has_sync_method(self, executor_with_storage) -> None: result = await executor_with_storage.run("callable(deps.sync)") assert result.error is None - assert result.value in (True, "True") + assert result.value is True @pytest.mark.asyncio async def test_deps_repr_shows_package_count(self, executor_with_storage) -> None: @@ -1808,14 +1738,14 @@ async def test_reset_preserves_deps_namespace(self, executor_with_storage) -> No """ # Verify deps exists before reset result = await executor_with_storage.run("'deps' in dir()") - assert result.value in (True, "True") + assert result.value is True await executor_with_storage.reset() # deps should still exist after reset result = await executor_with_storage.run("'deps' in dir()") assert result.error is None - assert result.value in (True, "True") + assert result.value is True @pytest.mark.slow @@ -1906,7 +1836,7 @@ async def test_deps_add_persists_to_store(self, executor_allow_deps) -> None: # Verify it's in the list result = await executor_allow_deps.run("'requests' in str(deps.list())") assert result.error is None - assert result.value in (True, "True") + assert result.value is True @pytest.mark.asyncio async def test_deps_add_raises_when_runtime_deps_disabled(self, executor_deny_deps) -> None: diff --git a/tests/test_subprocess_namespace_injection.py b/tests/test_subprocess_namespace_injection.py index fd4c8cb..5e956f0 100644 --- a/tests/test_subprocess_namespace_injection.py +++ 
b/tests/test_subprocess_namespace_injection.py @@ -203,7 +203,7 @@ async def test_tools_list_returns_tool_objects(self, executor_with_storage) -> N # Verify it returns a list check_result = await executor_with_storage.run("isinstance(tools.list(), list)") - assert check_result.value in (True, "True") + assert check_result.value is True # Verify tools have expected keys (returned as dicts, not objects) result = await executor_with_storage.run("[t['name'] for t in tools.list()]") @@ -318,8 +318,7 @@ async def test_workflows_create_persists(self, executor_empty_storage) -> None: "'multiply' in [s['name'] if isinstance(s, dict) else s.name for s in workflows.list()]" ) assert result.error is None - # Accept True as bool or string - assert result.value in (True, "True"), f"Workflow not found in list: {result.value}" + assert result.value is True, f"Workflow not found in list: {result.value}" @pytest.mark.asyncio async def test_workflows_invoke_executes_workflow(self, executor_empty_storage) -> None: @@ -438,7 +437,7 @@ async def test_artifacts_save_persists_data(self, executor_empty_storage) -> Non # Verify exists result = await executor_empty_storage.run('artifacts.exists("test_data")') assert result.error is None - assert result.value in (True, "True") + assert result.value is True @pytest.mark.asyncio async def test_artifacts_load_retrieves_data(self, executor_empty_storage) -> None: @@ -479,7 +478,7 @@ async def test_artifacts_exists_checks_presence(self, executor_empty_storage) -> # Should not exist result = await executor_empty_storage.run('artifacts.exists("nonexistent")') assert result.error is None - assert result.value in (False, "False") + assert result.value is False # Save it await executor_empty_storage.run('artifacts.save("now_exists", "data")') @@ -487,7 +486,7 @@ async def test_artifacts_exists_checks_presence(self, executor_empty_storage) -> # Should exist result = await executor_empty_storage.run('artifacts.exists("now_exists")') assert result.error is None - assert result.value in (True, "True") + assert result.value is True # ============================================================================= @@ -529,7 +528,7 @@ async def test_namespaces_use_storage_paths(self, tmp_path: Path, echo_tool_yaml # Tools should be loaded from tools_path (dicts, not objects) result = await executor.run("'echo' in [t['name'] for t in tools.list()]") assert result.error is None - assert result.value in (True, "True") + assert result.value is True finally: await executor.close() @@ -559,7 +558,7 @@ async def test_namespace_state_persists_between_runs(self, executor_empty_storag "'counter' in str(workflows.list()) and 'state_test' in str(artifacts.list())" ) assert result.error is None - assert result.value in (True, "True") + assert result.value is True @pytest.mark.asyncio async def test_namespace_state_preserved_after_reset(self, tmp_path: Path) -> None: @@ -593,14 +592,14 @@ async def test_namespace_state_preserved_after_reset(self, tmp_path: Path) -> No # Namespaces should still be accessible result = await executor.run("'tools' in dir() and 'workflows' in dir()") - assert result.value in (True, "True") + assert result.value is True # Persisted data should still be there (it's in storage, not kernel memory) result = await executor.run("'persist' in str(workflows.list())") - assert result.value in (True, "True") + assert result.value is True result = await executor.run("'persist_artifact' in str(artifacts.list())") - assert result.value in (True, "True") + assert result.value is True 
finally: await executor.close() @@ -637,7 +636,7 @@ async def test_namespaces_available_immediately_after_start( "'tools' in dir() and 'workflows' in dir() and 'artifacts' in dir()" ) assert result.error is None - assert result.value in (True, "True") + assert result.value is True finally: await executor.close() @@ -653,7 +652,7 @@ async def test_namespace_objects_are_stable(self, executor_empty_storage) -> Non # Check ID is same in next run result = await executor_empty_storage.run("id(tools) == _tools_id") assert result.error is None - assert result.value in (True, "True") + assert result.value is True # ============================================================================= @@ -1128,7 +1127,7 @@ async def test_redis_namespace_full_execution( "'tools' in dir() and 'workflows' in dir() and 'artifacts' in dir()" ) assert result.error is None, f"Namespace check failed: {result.error}" - assert result.value in (True, "True"), "Namespaces should be available" + assert result.value is True, "Namespaces should be available" # Verify artifacts work with Redis backend result = await executor.run('artifacts.save("redis_test", {"from": "redis"}) or True') diff --git a/tests/test_tool_middleware_plumbing.py b/tests/test_tool_middleware_plumbing.py new file mode 100644 index 0000000..4da05b0 --- /dev/null +++ b/tests/test_tool_middleware_plumbing.py @@ -0,0 +1,173 @@ +from __future__ import annotations + +from typing import Any + +import pytest + +from py_code_mode.tools import ToolCallContext, ToolMiddleware, ToolRegistry +from py_code_mode.tools.types import Tool, ToolCallable, ToolParameter + + +class _FakeAdapter: + def __init__(self, tool_name: str = "echo") -> None: + self._tool_name = tool_name + self.calls: list[tuple[str, str | None, dict[str, Any]]] = [] + + def list_tools(self) -> list[Tool]: + return [ + Tool( + name=self._tool_name, + description="Echo", + callables=( + ToolCallable( + name="say", + description="Say", + parameters=( + ToolParameter( + name="message", + type="str", + required=True, + default=None, + description="msg", + ), + ), + ), + ), + ) + ] + + async def call_tool(self, name: str, callable_name: str | None, args: dict[str, Any]) -> Any: + self.calls.append((name, callable_name, dict(args))) + return {"ok": True, "name": name, "callable": callable_name, "args": dict(args)} + + async def describe(self, tool_name: str, callable_name: str) -> dict[str, str]: + return {"message": "msg"} + + async def close(self) -> None: + return None + + +@pytest.mark.asyncio +async def test_tool_middleware_wraps_registry_call_tool() -> None: + adapter = _FakeAdapter() + registry = ToolRegistry() + registry.register_adapter(adapter) # registers echo + + events: list[str] = [] + + class _Recorder(ToolMiddleware): + async def __call__(self, ctx: ToolCallContext, call_next): # type: ignore[override] + events.append(f"pre:{ctx.full_name}:{ctx.executor_type}:{ctx.origin}") + out = await call_next(ctx) + events.append(f"post:{ctx.full_name}") + return out + + registry.apply_tool_middlewares( + (_Recorder(),), + executor_type="deno-sandbox", + origin="deno-sandbox", + ) + + res = await registry.call_tool("echo", "say", {"message": "hi"}) + assert res["ok"] is True + assert adapter.calls == [("echo", "say", {"message": "hi"})] + assert events == [ + "pre:echo.say:deno-sandbox:deno-sandbox", + "post:echo.say", + ] + + +@pytest.mark.asyncio +async def test_tool_middleware_can_rewrite_args() -> None: + adapter = _FakeAdapter() + registry = ToolRegistry() + registry.register_adapter(adapter) + 
+ class _Rewrite(ToolMiddleware): + async def __call__(self, ctx: ToolCallContext, call_next): # type: ignore[override] + ctx.args["message"] = "rewritten" + return await call_next(ctx) + + registry.apply_tool_middlewares( + (_Rewrite(),), + executor_type="deno-sandbox", + origin="deno-sandbox", + ) + + res = await registry.call_tool("echo", "say", {"message": "hi"}) + assert res["args"]["message"] == "rewritten" + assert adapter.calls == [("echo", "say", {"message": "rewritten"})] + + +@pytest.mark.asyncio +async def test_tool_middleware_can_short_circuit() -> None: + from py_code_mode.errors import ToolCallError + + adapter = _FakeAdapter() + registry = ToolRegistry() + registry.register_adapter(adapter) + + class _Deny(ToolMiddleware): + async def __call__(self, ctx: ToolCallContext, call_next): # type: ignore[override] + raise RuntimeError(f"denied: {ctx.full_name}") + + registry.apply_tool_middlewares((_Deny(),), executor_type="deno-sandbox", origin="deno-sandbox") + + with pytest.raises(ToolCallError, match="denied: echo.say"): + await registry.call_tool("echo", "say", {"message": "hi"}) + assert adapter.calls == [] + + +@pytest.mark.asyncio +async def test_tool_middleware_applies_to_new_adapters_registered_later() -> None: + adapter1 = _FakeAdapter("echo1") + registry = ToolRegistry() + registry.register_adapter(adapter1) + + events: list[str] = [] + + class _Recorder(ToolMiddleware): + async def __call__(self, ctx: ToolCallContext, call_next): # type: ignore[override] + events.append(f"pre:{ctx.full_name}") + return await call_next(ctx) + + registry.apply_tool_middlewares( + (_Recorder(),), executor_type="deno-sandbox", origin="deno-sandbox" + ) + + # Register a new adapter after middleware is applied. + adapter2 = _FakeAdapter("echo2") + registry.register_adapter(adapter2) + + res = await registry.call_tool("echo2", "say", {"message": "hi"}) + assert res["ok"] is True + assert events == ["pre:echo2.say"] + + +@pytest.mark.asyncio +async def test_apply_tool_middlewares_replaces_chain_not_stacks() -> None: + adapter = _FakeAdapter() + registry = ToolRegistry() + registry.register_adapter(adapter) + + events: list[str] = [] + + class _RecorderA(ToolMiddleware): + async def __call__(self, ctx: ToolCallContext, call_next): # type: ignore[override] + events.append("A") + return await call_next(ctx) + + class _RecorderB(ToolMiddleware): + async def __call__(self, ctx: ToolCallContext, call_next): # type: ignore[override] + events.append("B") + return await call_next(ctx) + + registry.apply_tool_middlewares( + (_RecorderA(),), executor_type="deno-sandbox", origin="deno-sandbox" + ) + registry.apply_tool_middlewares( + (_RecorderB(),), executor_type="deno-sandbox", origin="deno-sandbox" + ) + + await registry.call_tool("echo", "say", {"message": "hi"}) + assert events == ["B"] diff --git a/tests/test_tool_proxy_explicit_methods.py b/tests/test_tool_proxy_explicit_methods.py index 7669cb0..b14c336 100644 --- a/tests/test_tool_proxy_explicit_methods.py +++ b/tests/test_tool_proxy_explicit_methods.py @@ -196,14 +196,11 @@ class TestBackwardCompatibility: @pytest.mark.asyncio async def test_dunder_call_still_works_async(self, callable_proxy: CallableProxy) -> None: - """__call__ from async context still returns coroutine.""" + """__call__ from async context still returns a sync result.""" result = callable_proxy(value="dunder_async") - # In async context, __call__ returns coroutine - assert inspect.iscoroutine(result) - - final = await result - assert "testtool.action" in final + assert not 
inspect.iscoroutine(result) + assert "testtool.action" in result def test_dunder_call_still_works_sync(self, callable_proxy: CallableProxy) -> None: """__call__ from sync context still returns result.""" diff --git a/tests/test_vector_store.py b/tests/test_vector_store.py index 188b226..07b9f9a 100644 --- a/tests/test_vector_store.py +++ b/tests/test_vector_store.py @@ -11,70 +11,6 @@ import pytest -class TestVectorStoreProtocol: - """Protocol compliance tests for VectorStore implementations.""" - - def test_vector_store_protocol_exists(self) -> None: - """VectorStore protocol should be importable from workflows module.""" - # Protocol should be runtime checkable - - from py_code_mode.workflows.vector_store import VectorStore - - assert isinstance(VectorStore, type) - - def test_protocol_has_add_method(self) -> None: - """VectorStore must define add() method signature.""" - from py_code_mode.workflows.vector_store import VectorStore - - # Protocol defines method signatures at class level - assert hasattr(VectorStore, "add") - - def test_protocol_has_remove_method(self) -> None: - """VectorStore must define remove() method signature.""" - from py_code_mode.workflows.vector_store import VectorStore - - assert hasattr(VectorStore, "remove") - - def test_protocol_has_search_method(self) -> None: - """VectorStore must define search() method signature.""" - from py_code_mode.workflows.vector_store import VectorStore - - assert hasattr(VectorStore, "search") - - def test_protocol_has_get_content_hash_method(self) -> None: - """VectorStore must define get_content_hash() for change detection.""" - from py_code_mode.workflows.vector_store import VectorStore - - assert hasattr(VectorStore, "get_content_hash") - - def test_protocol_has_get_model_info_method(self) -> None: - """VectorStore must define get_model_info() for model validation.""" - from py_code_mode.workflows.vector_store import VectorStore - - assert hasattr(VectorStore, "get_model_info") - - def test_protocol_has_clear_method(self) -> None: - """VectorStore must define clear() to reset index.""" - from py_code_mode.workflows.vector_store import VectorStore - - assert hasattr(VectorStore, "clear") - - def test_protocol_has_count_method(self) -> None: - """VectorStore must define count() to get indexed workflow count.""" - from py_code_mode.workflows.vector_store import VectorStore - - assert hasattr(VectorStore, "count") - - def test_protocol_is_runtime_checkable(self) -> None: - """Protocol should support isinstance() checks.""" - - from py_code_mode.workflows.vector_store import VectorStore - - # Check that VectorStore has the runtime_checkable marker - # This allows isinstance(obj, VectorStore) to work - assert hasattr(VectorStore, "__protocol_attrs__") or hasattr(VectorStore, "_is_protocol") - - class TestModelInfo: """Tests for ModelInfo dataclass."""
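The new tests in tests/test_tool_middleware_plumbing.py above exercise the middleware plumbing end to end. A minimal host-side usage sketch built from the same API surface follows; the AuditMiddleware class, the logger, and the attach_audit helper are illustrative names and are not added by this change.

    # Hedged usage sketch mirroring ToolMiddleware / ToolCallContext /
    # ToolRegistry.apply_tool_middlewares as exercised by the plumbing tests above.
    import logging

    from py_code_mode.tools import ToolCallContext, ToolMiddleware, ToolRegistry

    log = logging.getLogger("tool-audit")


    class AuditMiddleware(ToolMiddleware):
        """Log every host-side tool call before and after it runs."""

        async def __call__(self, ctx: ToolCallContext, call_next):
            log.info("tool call %s from %s args=%r", ctx.full_name, ctx.origin, ctx.args)
            result = await call_next(ctx)
            log.info("tool call %s completed", ctx.full_name)
            return result


    def attach_audit(registry: ToolRegistry) -> None:
        # Per the tests above, re-applying middlewares replaces the existing
        # chain rather than stacking a second chain on top of it.
        registry.apply_tool_middlewares(
            (AuditMiddleware(),),
            executor_type="deno-sandbox",
            origin="deno-sandbox",
        )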