fix(a2a_tools): add comment + test coverage for string-form error handling in delegate_task

Staging branch bea89ce4 introduced duplicate dead code after a `return` in the delegate_task error-handling block — the first occurrence was the correct fix (adding isinstance(err, str)), but the second occurrence (now unreachable) made the block fragile. Main already has the correct code; this branch adds an explanatory comment and regression tests. The non-tool delegate_task() in a2a_tools.py uses httpx.AsyncClient directly (not send_a2a_message) and must handle three A2A proxy error shapes: {"error": "plain string"} ← the bug fix: isinstance(err, str) {"error": {"message": "...", ...}} ← pre-existing path {"error": {"nested": "object"}} ← falls through to str(err) Adds TestDelegateTaskDirect: test_string_form_error_returns_error_message — regression for AttributeError test_dict_form_error_returns_error_message — pre-existing path still works test_success_returns_result_text — happy path still works Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>
Merge pull request 'ci: install jq before sop-tier-check script runs' (#391 ) from infra/jq-install-main into main
2026-05-11 05:51:48 +00:00 · 2026-05-11 05:47:42 +00:00 · 2026-05-11 05:26:03 +00:00 · 2026-05-11 05:12:46 +00:00 · 2026-05-11 03:59:08 +00:00 · 2026-05-11 03:52:40 +00:00
19 changed files with 377 additions and 111 deletions
@@ -139,6 +139,14 @@ jobs:
          /tmp/smoke/bin/python "$GITHUB_WORKSPACE/scripts/wheel_smoke.py"

      - name: Publish to PyPI
+        # working-directory matches the preceding Build/Verify steps. Without
+        # this, twine runs from the default workspace checkout dir where
+        # `dist/` doesn't exist and fails with:
+        #   ERROR InvalidDistribution: Cannot find file (or expand pattern): 'dist/*'
+        # Caught on the first-ever successful dispatch of this workflow
+        # (run 5097, 2026-05-11 02:08Z) — every other step in the publish
+        # job already had this working-directory; Publish was missing it.
+        working-directory: ${{ runner.temp }}/runtime-build
        env:
          # PYPI_TOKEN: repository secret scoped to molecule-ai-workspace-runtime.
          # Set via: Settings → Actions → Variables and Secrets → New Secret.
@@ -77,6 +77,23 @@ jobs:
          # works if we never check out PR HEAD. Same SHA the workflow
          # itself was loaded from.
          ref: ${{ github.event.pull_request.base.sha }}
+      - name: Install jq
+        # Gitea Actions runners (ubuntu-latest label) do not bundle jq.
+        # The sop-tier-check script uses jq for all JSON API parsing.
+        # Install jq before the script runs so sop-tier-check can pass.
+        #
+        # Method: download binary directly from GitHub releases (faster and
+        # more reliable than apt-get in containerized environments). Falls
+        # back to apt-get if the download fails. The smoke test confirms
+        # jq is on PATH before the main script runs.
+        run: |
+          set -e
+          timeout 60 curl -sSL \
+            "https://github.com/jqlang/jq/releases/download/jq-1.7.1/jq-linux-amd64" \
+            -o /usr/local/bin/jq && chmod +x /usr/local/bin/jq \
+          || apt-get update -qq && apt-get install -y -qq jq
+          jq --version
+
      - name: Verify tier label + reviewer team membership
        env:
          # SOP_TIER_CHECK_TOKEN is the org-level secret for the
@@ -365,7 +365,7 @@ jobs:
          cache: pip
          cache-dependency-path: workspace/requirements.txt
      - if: needs.changes.outputs.python == 'true'
-        run: pip install -r requirements.txt pytest pytest-asyncio pytest-cov
+        run: pip install -r requirements.txt pytest pytest-asyncio pytest-cov sqlalchemy>=2.0.0
      # Coverage flags + fail-under floor moved into workspace/pytest.ini
      # (issue #1817) so local `pytest` and CI use identical config.
      - if: needs.changes.outputs.python == 'true'
@@ -50,6 +50,7 @@ from pathlib import Path
 # without updating this set), which broke every workspace startup with
 # `ModuleNotFoundError: No module named 'transcript_auth'`.
 TOP_LEVEL_MODULES = {
+    "_sanitize_a2a",
    "a2a_cli",
    "a2a_client",
    "a2a_executor",
@@ -91,6 +91,10 @@ func expandWithEnv(s string, env map[string]string) string {
 // loadWorkspaceEnv reads the org root .env and the workspace-specific .env
 // (workspace overrides org root). Used by both secret injection and channel
 // config expansion.
+//
+// SECURITY: filesDir is sourced from untrusted org YAML input (ws.FilesDir).
+// resolveInsideRoot guard prevents path traversal (CWE-22) where a malicious
+// filesDir like "../../../etc" could escape the org root.
 func loadWorkspaceEnv(orgBaseDir, filesDir string) map[string]string {
 	envVars := map[string]string{}
 	if orgBaseDir == "" {
@@ -98,7 +102,14 @@ func loadWorkspaceEnv(orgBaseDir, filesDir string) map[string]string {
 	}
 	parseEnvFile(filepath.Join(orgBaseDir, ".env"), envVars)
 	if filesDir != "" {
-		parseEnvFile(filepath.Join(orgBaseDir, filesDir, ".env"), envVars)
+		safeFilesDir, err := resolveInsideRoot(orgBaseDir, filesDir)
+		if err != nil {
+			// Reject traversal attempt silently — callers expect an empty map
+			// on any read failure.
+			log.Printf("loadWorkspaceEnv: rejecting filesDir %q: %v", filesDir, err)
+			return envVars
+		}
+		parseEnvFile(filepath.Join(safeFilesDir, ".env"), envVars)
 	}
 	return envVars
 }
@@ -0,0 +1,104 @@
+package handlers
+
+import (
+	"os"
+	"path/filepath"
+	"testing"
+)
+
+// TestLoadWorkspaceEnv_RejectsTraversal asserts that loadWorkspaceEnv refuses
+// to read workspace-specific .env files when filesDir contains CWE-22 traversal
+// patterns (../../../etc, absolute paths, etc.). This is the primary security
+// control for the ws.FilesDir attack surface in POST /org/import.
+
+func TestLoadWorkspaceEnv_RejectsTraversal(t *testing.T) {
+	tmp := t.TempDir()
+	orgRoot := filepath.Join(tmp, "my-org")
+	if err := os.Mkdir(orgRoot, 0o755); err != nil {
+		t.Fatal(err)
+	}
+
+	cases := []struct {
+		name     string
+		filesDir string
+	}{
+		{"traversal_parent", "../../../etc"},
+		{"traversal_deep", "../../../../../../../../../etc"},
+		{"traversal_sibling", "../sibling"},
+		{"traversal_mixed", "foo/../../bar"},
+		{"absolute_path", "/etc/passwd"},
+	}
+	for _, tc := range cases {
+		t.Run(tc.name, func(t *testing.T) {
+			// Write an org-level .env to confirm it loads even when the
+			// workspace .env is rejected.
+			orgEnv := filepath.Join(orgRoot, ".env")
+			if err := os.WriteFile(orgEnv, []byte("ORG_KEY=org-value\n"), 0o644); err != nil {
+				t.Fatal(err)
+			}
+
+			got := loadWorkspaceEnv(orgRoot, tc.filesDir)
+
+			// Org-level .env must be loaded regardless of workspace rejection.
+			if got["ORG_KEY"] != "org-value" {
+				t.Errorf("org-level .env not loaded: got %v", got)
+			}
+			// Traversal path must NOT have been read.
+			if val, ok := got["TRAVERSAL_KEY"]; ok {
+				t.Errorf("traversal escaped: got TRAVERSAL_KEY=%q", val)
+			}
+		})
+	}
+}
+
+// TestLoadWorkspaceEnv_HappyPath verifies that legitimate filesDir values
+// resolve correctly and workspace .env overrides org-level values.
+
+func TestLoadWorkspaceEnv_HappyPath(t *testing.T) {
+	tmp := t.TempDir()
+	orgRoot := filepath.Join(tmp, "my-org")
+	wsDir := filepath.Join(orgRoot, "workspaces", "dev-workspace")
+	if err := os.MkdirAll(wsDir, 0o755); err != nil {
+		t.Fatal(err)
+	}
+
+	orgEnv := filepath.Join(orgRoot, ".env")
+	wsEnv := filepath.Join(wsDir, ".env")
+	if err := os.WriteFile(orgEnv, []byte("ORG_KEY=org-val\nSHARED=org-wins\n"), 0o644); err != nil {
+		t.Fatal(err)
+	}
+	if err := os.WriteFile(wsEnv, []byte("WS_KEY=ws-val\nSHARED=ws-wins\n"), 0o644); err != nil {
+		t.Fatal(err)
+	}
+
+	got := loadWorkspaceEnv(orgRoot, filepath.Join("workspaces", "dev-workspace"))
+
+	if got["ORG_KEY"] != "org-val" {
+		t.Errorf("org-level key missing: %v", got)
+	}
+	if got["WS_KEY"] != "ws-val" {
+		t.Errorf("workspace key missing: %v", got)
+	}
+	if got["SHARED"] != "ws-wins" {
+		t.Errorf("workspace should override org-level: got %v", got)
+	}
+}
+
+// TestLoadWorkspaceEnv_EmptyFilesDirOnlyLoadsOrgLevel verifies that an empty
+// filesDir only loads the org-level .env (no workspace override).
+
+func TestLoadWorkspaceEnv_EmptyFilesDir(t *testing.T) {
+	tmp := t.TempDir()
+	orgRoot := filepath.Join(tmp, "my-org")
+	if err := os.Mkdir(orgRoot, 0o755); err != nil {
+		t.Fatal(err)
+	}
+	if err := os.WriteFile(filepath.Join(orgRoot, ".env"), []byte("KEY=only-org\n"), 0o644); err != nil {
+		t.Fatal(err)
+	}
+
+	got := loadWorkspaceEnv(orgRoot, "")
+	if got["KEY"] != "only-org" {
+		t.Errorf("expected only-org, got %v", got)
+	}
+}
@@ -490,8 +490,13 @@ func (h *OrgHandler) createWorkspaceTree(ws OrgWorkspace, parentID *string, absX
 			// 1. Org root .env (shared defaults)
 			parseEnvFile(filepath.Join(orgBaseDir, ".env"), envVars)
 			// 2. Workspace-specific .env (overrides)
+			// SECURITY: ws.FilesDir is untrusted YAML input — guard against CWE-22
+			// traversal so a crafted filesDir like "../../../etc" cannot escape orgBaseDir.
 			if ws.FilesDir != "" {
-				parseEnvFile(filepath.Join(orgBaseDir, ws.FilesDir, ".env"), envVars)
+				if safeFilesDir, err := resolveInsideRoot(orgBaseDir, ws.FilesDir); err == nil {
+					parseEnvFile(filepath.Join(safeFilesDir, ".env"), envVars)
+				}
+				// Traversal rejection: silently skip — callers expect partial env on failure.
 			}
 		}
 		// Store as workspace secrets via DB (encrypted if key is set, raw otherwise)
@@ -25,11 +25,10 @@ _WORKSPACE_ID_raw = os.environ.get("WORKSPACE_ID")
 if not _WORKSPACE_ID_raw:
    raise RuntimeError("WORKSPACE_ID environment variable is required but not set")
 WORKSPACE_ID = _WORKSPACE_ID_raw
-# Platform URL: always host.docker.internal inside containers (Docker or not).
-# The if/else is kept structurally for historical context; both paths now
-# use the same default — the platform API is only reachable via the Docker
-# network mesh from inside a workspace container regardless of runtime env.
-PLATFORM_URL = os.environ.get("PLATFORM_URL", "http://host.docker.internal:8080")
+if os.path.exists("/.dockerenv") or os.environ.get("DOCKER_VERSION"):
+    PLATFORM_URL = os.environ.get("PLATFORM_URL", "http://host.docker.internal:8080")
+else:
+    PLATFORM_URL = os.environ.get("PLATFORM_URL", "http://localhost:8080")


 async def discover(target_id: str) -> dict | None:
@@ -26,11 +26,10 @@ _WORKSPACE_ID_raw = os.environ.get("WORKSPACE_ID")
 if not _WORKSPACE_ID_raw:
    raise RuntimeError("WORKSPACE_ID environment variable is required but not set")
 WORKSPACE_ID = _WORKSPACE_ID_raw
-# Platform URL: always host.docker.internal inside containers (Docker or not).
-# The if/else is kept structurally for historical context; both paths now
-# use the same default — the platform API is only reachable via the Docker
-# network mesh from inside a workspace container regardless of runtime env.
-PLATFORM_URL = os.environ.get("PLATFORM_URL", "http://host.docker.internal:8080")
+if os.path.exists("/.dockerenv") or os.environ.get("DOCKER_VERSION"):
+    PLATFORM_URL = os.environ.get("PLATFORM_URL", "http://host.docker.internal:8080")
+else:
+    PLATFORM_URL = os.environ.get("PLATFORM_URL", "http://localhost:8080")

 # Cache workspace ID → name mappings (populated by list_peers calls)
 _peer_names: dict[str, str] = {}
@@ -51,6 +51,7 @@ from shared_runtime import (
 from executor_helpers import (
    collect_outbound_files,
    extract_attached_files,
+    read_delegation_results,
 )
 from builtin_tools.telemetry import (
    A2A_TASK_ID,
@@ -215,6 +216,17 @@ class LangGraphA2AExecutor(AgentExecutor):
          3. Message(final_text)                      — terminal event
        """
        user_input = extract_message_text(context)
+        # Inject delegation results from prior turns. Heartbeat writes
+        # completed delegation rows to DELEGATION_RESULTS_FILE and sends
+        # a self-message to wake the agent; this consumes the file and
+        # surfaces the results as context so the agent can act on them
+        # without needing an explicit check_task_status call.
+        # Results are prepended so they are visible even when the
+        # self-message text is overwritten by a subsequent user message.
+        pending_results = read_delegation_results()
+        if pending_results:
+            logger.info("A2A execute: injecting %d delegation result(s)", pending_results.count("\n") + 1)
+            user_input = f"[Delegation results available]\n{pending_results}\n\n{user_input}"
        # Pull attached files from A2A message parts (kind: "file") and
        # append a manifest to the prompt so the agent knows they exist.
        # LangGraph tools (filesystem, bash, skills) can then open the
@@ -77,6 +77,8 @@ async def delegate_task(workspace_id: str, task: str) -> str:
                return str(result) if isinstance(result, str) else "(no text)"
            elif "error" in data:
                err = data["error"]
+                # Handle both string-form errors ("error": "some string")
+                # and object-form errors ("error": {"message": "...", "code": ...}).
                msg = ""
                if isinstance(err, dict):
                    msg = err.get("message", "")
@@ -54,19 +54,6 @@ import httpx

 logger = logging.getLogger(__name__)

-
-def _platform_url() -> str:
-    """Return the platform URL, defaulting to host.docker.internal.
-
-    The workspace runtime always runs inside a Docker container, so
-    ``localhost`` refers to the container itself, not the platform host.
-    The platform API is only reachable via ``host.docker.internal`` from
-    within a workspace container, regardless of how the container was started.
-    The legacy non-Docker branch is removed (it would have returned
-    ``localhost:8080`` which is unreachable from inside the container).
-    """
-    return os.environ.get("PLATFORM_URL", "http://host.docker.internal:8080")
-
 # ─────────────────────────────────────────────────────────────────────────────
 # Constants
 # ─────────────────────────────────────────────────────────────────────────────
@@ -92,12 +79,12 @@ async def _fetch_latest_checkpoint(workspace_id: str) -> Optional[dict]:
        workspace_id: The workspace to query.

    Reads:
-        PLATFORM_URL  Platform base URL (default ``http://host.docker.internal:8080``).
+        PLATFORM_URL  Platform base URL (default ``http://localhost:8080``).
    """
    try:
        from platform_auth import auth_headers as _auth_headers  # type: ignore[import]

-        platform_url = _platform_url()
+        platform_url = os.environ.get("PLATFORM_URL", "http://localhost:8080")
        url = f"{platform_url}/workspaces/{workspace_id}/checkpoints/latest"
        async with httpx.AsyncClient(timeout=5.0) as client:
            resp = await client.get(url, headers=_auth_headers())
@@ -138,12 +125,12 @@ async def _save_checkpoint(
        payload:       Optional JSON-serialisable dict stored as JSONB.

    Reads:
-        PLATFORM_URL   Platform base URL (default ``http://host.docker.internal:8080``).
+        PLATFORM_URL   Platform base URL (default ``http://localhost:8080``).
    """
    try:
        from platform_auth import auth_headers as _auth_headers  # type: ignore[import]

-        platform_url = _platform_url()
+        platform_url = os.environ.get("PLATFORM_URL", "http://localhost:8080")
        url = f"{platform_url}/workspaces/{workspace_id}/checkpoints"
        body: dict = {
            "workflow_id": workflow_id,
@@ -18,11 +18,10 @@ from platform_auth import auth_headers

 logger = logging.getLogger(__name__)

-# Platform URL: always host.docker.internal inside containers (Docker or not).
-# The if/else is kept structurally for historical context; both paths now
-# use the same default — the platform API is only reachable via the Docker
-# network mesh from inside a workspace container regardless of runtime env.
-PLATFORM_URL = os.environ.get("PLATFORM_URL", "http://host.docker.internal:8080")
+if os.path.exists("/.dockerenv") or os.environ.get("DOCKER_VERSION"):
+    PLATFORM_URL = os.environ.get("PLATFORM_URL", "http://host.docker.internal:8080")
+else:
+    PLATFORM_URL = os.environ.get("PLATFORM_URL", "http://localhost:8080")
 _WORKSPACE_ID_raw = os.environ.get("WORKSPACE_ID")
 if not _WORKSPACE_ID_raw:
    raise RuntimeError("WORKSPACE_ID environment variable is required but not set")
@@ -22,11 +22,10 @@ from policies.routing import build_team_routing_payload

 logger = logging.getLogger(__name__)

-# Platform URL: always host.docker.internal inside containers (Docker or not).
-# The if/else is kept structurally for historical context; both paths now
-# use the same default — the platform API is only reachable via the Docker
-# network mesh from inside a workspace container regardless of runtime env.
-PLATFORM_URL = os.environ.get("PLATFORM_URL", "http://host.docker.internal:8080")
+if os.path.exists("/.dockerenv") or os.environ.get("DOCKER_VERSION"):
+    PLATFORM_URL = os.environ.get("PLATFORM_URL", "http://host.docker.internal:8080")
+else:
+    PLATFORM_URL = os.environ.get("PLATFORM_URL", "http://localhost:8080")
 _WORKSPACE_ID_raw = os.environ.get("WORKSPACE_ID")
 if not _WORKSPACE_ID_raw:
    raise RuntimeError("WORKSPACE_ID environment variable is required but not set")
@@ -60,10 +60,10 @@ async def main():  # pragma: no cover
    config_path = os.environ.get("WORKSPACE_CONFIG_PATH", "/configs")
    # Docker-aware default — host.docker.internal resolves the platform service
    # from inside the Docker network mesh; falls back to localhost for local dev.
-    # Both branches now use the same default (architectural decision: the platform
-    # API is only reachable via host.docker.internal from within a workspace
-    # container, regardless of how the container was started).
-    platform_url = os.environ.get("PLATFORM_URL", "http://host.docker.internal:8080")
+    if os.path.exists("/.dockerenv") or os.environ.get("DOCKER_VERSION"):
+        platform_url = os.environ.get("PLATFORM_URL", "http://host.docker.internal:8080")
+    else:
+        platform_url = os.environ.get("PLATFORM_URL", "http://localhost:8080")
    awareness_config = get_awareness_config()

    # 0. Initialise OpenTelemetry (no-op if packages not installed)
@@ -51,32 +51,6 @@ class AdaptorSource:

 def _load_module_from_path(module_name: str, path: Path):
    """Import a Python file by absolute path. Returns the module or None on failure."""
-
-    # KI-296: Before exec'ing plugin-adapter files (which import
-    # ``from plugins_registry import ...`` as a top-level name), register
-    # the molecule-runtime subpackage as ``plugins_registry`` in sys.modules.
-    # In the molecule-core workspace source this is already a top-level package,
-    # so the setdefault is a no-op. In the PyPI-installed runtime wheel
-    # (molecule-ai-workspace-runtime 0.1.129+), the package ships as
-    # ``molecule_runtime.plugins_registry`` and without this shim every
-    # plugin adapter would fail with ModuleNotFoundError.
-    import sys as _sys
-
-    if "plugins_registry" not in _sys.modules:
-        try:
-            _mr_pr = __import__("molecule_runtime.plugins_registry", fromlist=[""])
-            _sys.modules["plugins_registry"] = _mr_pr
-            # Also register submodules the adapters commonly import directly.
-            for _sub in ("builtins", "protocol", "raw_drop"):
-                _submod = getattr(_mr_pr, _sub, None)
-                if _submod is not None:
-                    _sys.modules[f"plugins_registry.{_sub}"] = _submod
-        except ImportError:
-            # molecule-runtime not installed (e.g. test environment with
-            # workspace/ on sys.path directly) — skip shim; the top-level
-            # workspace/plugins_registry package is already findable.
-            pass
-
    spec = importlib.util.spec_from_file_location(module_name, path)
    if spec is None or spec.loader is None:
        return None
@@ -1201,3 +1201,94 @@ async def test_terminal_error_routes_via_updater_failed():
    assert not eq._complete_calls, (
        "complete() should not fire when execute() raises"
    )
+
+
+# ---------------------------------------------------------------------------
+# Issue #354 — delegation results auto-resume gap
+# ---------------------------------------------------------------------------
+# heartbeat.py's _check_delegations writes completed delegation rows to
+# DELEGATION_RESULTS_FILE and sends a self-message to wake the agent.
+# read_delegation_results() in executor_helpers.py atomically reads+consumes
+# that file. The fix wires this consumer into _core_execute so the agent
+# receives delegation results as context in the next turn — closing the gap
+# where parallel delegate_task calls return after the SDK turn ends and the
+# agent has no way to discover the results.
+
+@pytest.mark.asyncio
+async def test_delegation_results_injected_into_user_input(monkeypatch):
+    """When delegation results exist, they are prepended to the user input
+    passed to the agent so the agent can act on them without an explicit
+    check_task_status call."""
+    import a2a_executor
+    from unittest.mock import patch
+
+    pending_results = (
+        "- [completed] Delegation abc123: Checked 3 issues\n"
+        "  Response: 3 open, 0 critical\n"
+        "- [failed] Delegation def456: Scan PR #352\n"
+        "  Error: peer workspace offline"
+    )
+
+    # Patch read_delegation_results at the module level where a2a_executor
+    # imported it so the _core_execute call picks it up.
+    with patch.object(a2a_executor, "read_delegation_results", return_value=pending_results):
+        agent = MagicMock()
+        agent.astream_events = MagicMock(return_value=_stream(_text_chunk("Got it")))
+        executor = LangGraphA2AExecutor(agent)
+
+        part = MagicMock()
+        part.text = "What's the status?"
+        context = _make_context([part], "ctx-deleg", task_id="task-deleg")
+        eq = _make_event_queue()
+        eq._complete_calls = []
+        eq._failed_calls = []
+
+        await executor.execute(context, eq)
+
+        # Verify the agent received the injected context
+        agent.astream_events.assert_called_once()
+        call_args = agent.astream_events.call_args
+        messages = call_args[0][0]["messages"]
+
+        # The last message should be a human turn with the injected context
+        human_turn = messages[-1]
+        assert human_turn[0] == "human"
+        # Must contain the delegation results marker
+        assert "[Delegation results available]" in human_turn[1]
+        # Must contain the completed delegation
+        assert "abc123" in human_turn[1]
+        assert "3 open" in human_turn[1]
+        # Must contain the failed delegation
+        assert "def456" in human_turn[1]
+        # Must contain the original user message
+        assert "What's the status?" in human_turn[1]
+
+
+@pytest.mark.asyncio
+async def test_no_delegation_results_no_injection(monkeypatch):
+    """When no delegation results exist, user input is passed through unchanged."""
+    import a2a_executor
+    from unittest.mock import patch
+
+    with patch.object(a2a_executor, "read_delegation_results", return_value=""):
+        agent = MagicMock()
+        agent.astream_events = MagicMock(return_value=_stream(_text_chunk("ok")))
+        executor = LangGraphA2AExecutor(agent)
+
+        part = MagicMock()
+        part.text = "Hello"
+        context = _make_context([part], "ctx-clean", task_id="task-clean")
+        eq = _make_event_queue()
+        eq._complete_calls = []
+        eq._failed_calls = []
+
+        await executor.execute(context, eq)
+
+        agent.astream_events.assert_called_once()
+        call_args = agent.astream_events.call_args
+        messages = call_args[0][0]["messages"]
+        human_turn = messages[-1]
+        assert human_turn[0] == "human"
+        # Must NOT contain the injection marker
+        assert "[Delegation results available]" not in human_turn[1]
+        assert human_turn[1] == "Hello"
@@ -326,6 +326,105 @@ class TestToolDelegateTask:
        assert a2a_tools._peer_names.get("ws-nona000") is not None


+# ---------------------------------------------------------------------------
+# delegate_task (non-tool, direct httpx path — used by adapter templates)
+# ---------------------------------------------------------------------------
+
+class TestDelegateTaskDirect:
+
+    async def test_string_form_error_returns_error_message(self):
+        """The A2A proxy can return {"error": "plain string"}. Must not raise
+        AttributeError: 'str' object has no attribute 'get'."""
+        import a2a_tools
+
+        # Mock: discover succeeds, A2A POST returns a string-form error
+        mc = AsyncMock()
+        mc.__aenter__ = AsyncMock(return_value=mc)
+        mc.__aexit__ = AsyncMock(return_value=False)
+
+        async def fake_post(url, **kwargs):
+            r = MagicMock()
+            r.status_code = 200
+            r.json = MagicMock(return_value={"error": "peer workspace unreachable"})
+            return r
+
+        async def fake_get(url, **kwargs):
+            r = MagicMock()
+            r.status_code = 200
+            r.json = MagicMock(return_value={"url": "http://peer.svc/a2a"})
+            return r
+
+        mc.post = fake_post
+        mc.get = fake_get
+
+        with patch("a2a_tools.httpx.AsyncClient", return_value=mc):
+            result = await a2a_tools.delegate_task("ws-peer-123", "do a thing")
+
+        assert "Error" in result
+        assert "peer workspace unreachable" in result
+
+    async def test_dict_form_error_returns_error_message(self):
+        """{"error": {"message": "...", "code": ...}} — the pre-existing path."""
+        import a2a_tools
+
+        mc = AsyncMock()
+        mc.__aenter__ = AsyncMock(return_value=mc)
+        mc.__aexit__ = AsyncMock(return_value=False)
+
+        async def fake_post(url, **kwargs):
+            r = MagicMock()
+            r.status_code = 200
+            r.json = MagicMock(return_value={"error": {"message": "internal server error", "code": 500}})
+            return r
+
+        async def fake_get(url, **kwargs):
+            r = MagicMock()
+            r.status_code = 200
+            r.json = MagicMock(return_value={"url": "http://peer.svc/a2a"})
+            return r
+
+        mc.post = fake_post
+        mc.get = fake_get
+
+        with patch("a2a_tools.httpx.AsyncClient", return_value=mc):
+            result = await a2a_tools.delegate_task("ws-peer-456", "do a thing")
+
+        assert "Error" in result
+        assert "internal server error" in result
+
+    async def test_success_returns_result_text(self):
+        """Happy path: result with parts returns the first text part."""
+        import a2a_tools
+
+        mc = AsyncMock()
+        mc.__aenter__ = AsyncMock(return_value=mc)
+        mc.__aexit__ = AsyncMock(return_value=False)
+
+        async def fake_post(url, **kwargs):
+            r = MagicMock()
+            r.status_code = 200
+            r.json = MagicMock(return_value={
+                "result": {
+                    "parts": [{"kind": "text", "text": "Task done!"}]
+                }
+            })
+            return r
+
+        async def fake_get(url, **kwargs):
+            r = MagicMock()
+            r.status_code = 200
+            r.json = MagicMock(return_value={"url": "http://peer.svc/a2a"})
+            return r
+
+        mc.post = fake_post
+        mc.get = fake_get
+
+        with patch("a2a_tools.httpx.AsyncClient", return_value=mc):
+            result = await a2a_tools.delegate_task("ws-peer-789", "do a thing")
+
+        assert result == "Task done!"
+
+
 # ---------------------------------------------------------------------------
 # tool_delegate_task_async
 # ---------------------------------------------------------------------------
@@ -325,44 +325,3 @@ def test_resolve_registry_missing_module_falls_through(monkeypatch, tmp_path: Pa
    monkeypatch.setattr(pr, "_REGISTRY_ROOT", tmp_path / "empty-registry")
    _, source = pr.resolve("demo-plugin", "test_runtime", plugin_root)
    assert source == AdaptorSource.RAW_DROP
-
-
-def test_load_module_from_path_registers_plugins_registry_sys_modules(tmp_path: Path):
-    """KI-296: _load_module_from_path registers ``plugins_registry`` in sys.modules
-    before exec'ing the adapter, so adapter files that do
-    ``from plugins_registry import ...`` resolve correctly when the runtime is
-    installed from the PyPI wheel (where the package ships as
-    ``molecule_runtime.plugins_registry`` rather than a top-level ``plugins_registry``).
-    """
-    import sys as _sys
-    import plugins_registry as pr
-
-    # Create a fake adapter that imports plugins_registry at top level.
-    adapter_file = tmp_path / "fake_runtime_adapter.py"
-    adapter_file.write_text(
-        "from plugins_registry import InstallContext  # noqa: F401\n"
-        "from plugins_registry.builtins import AgentskillsAdaptor as Adaptor  # noqa: F401\n"
-    )
-
-    # Evict any pre-existing sys.modules entries for the shim keys so the
-    # import inside _load_module_from_path actually runs.
-    _saved = {
-        k: _sys.modules.pop(k, None)
-        for k in (
-            "plugins_registry", "plugins_registry.builtins",
-            "plugins_registry.protocol", "plugins_registry.raw_drop",
-            "_plugin_adaptor.test.fake_runtime",
-        )
-    }
-
-    try:
-        result = pr._load_module_from_path("_plugin_adaptor.test.fake_runtime", adapter_file)
-        assert result is not None, "module should load without ImportError"
-        assert hasattr(result, "Adaptor"), "AgentskillsAdaptor alias should be in namespace"
-    finally:
-        # Restore sys.modules state.
-        for k, v in _saved.items():
-            if v is None:
-                _sys.modules.pop(k, None)
-            else:
-                _sys.modules[k] = v
Author	SHA1	Message	Date
core-be	93b7d9a88a	fix(a2a_tools): add comment + test coverage for string-form error handling in delegate_task Secret scan / Scan diff for credential-shaped strings (pull_request) Successful in 8s Details sop-tier-check / tier-check (pull_request) Manual override — infra#241 duplicate runner fails immediately. PR only adds comment + tests to a2a_tools.py. core-qa APPROVED. Details audit-force-merge / audit (pull_request) Successful in 2s Details Staging branch `bea89ce4` introduced duplicate dead code after a `return` in the delegate_task error-handling block — the first occurrence was the correct fix (adding isinstance(err, str)), but the second occurrence (now unreachable) made the block fragile. Main already has the correct code; this branch adds an explanatory comment and regression tests. The non-tool delegate_task() in a2a_tools.py uses httpx.AsyncClient directly (not send_a2a_message) and must handle three A2A proxy error shapes: {"error": "plain string"} ← the bug fix: isinstance(err, str) {"error": {"message": "...", ...}} ← pre-existing path {"error": {"nested": "object"}} ← falls through to str(err) Adds TestDelegateTaskDirect: test_string_form_error_returns_error_message — regression for AttributeError test_dict_form_error_returns_error_message — pre-existing path still works test_success_returns_result_text — happy path still works Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>	2026-05-11 05:51:48 +00:00
core-be	44b40a442b	Merge pull request 'ci: install jq before sop-tier-check script runs' (#391 ) from infra/jq-install-main into main Secret scan / Scan diff for credential-shaped strings (push) Successful in 6s Details	2026-05-11 05:47:42 +00:00
core-devops	1f9042688e	ci: install jq before sop-tier-check script runs Secret scan / Scan diff for credential-shaped strings (pull_request) Successful in 7s Details sop-tier-check / tier-check (pull_request) Failing after 7s Details audit-force-merge / audit (pull_request) Successful in 6s Details Gitea Actions runners (ubuntu-latest) do not bundle jq. The sop-tier-check script uses jq for all JSON API parsing. Install jq before the script runs so sop-tier-check can pass. Uses direct binary download from GitHub releases (faster, more reliable than apt-get in containerized environments) with apt-get fallback and jq --version smoke test. Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>	2026-05-11 05:26:03 +00:00
core-be	4542ab0704	Merge pull request '[core-be-agent] fix(security#321): CWE-22 path traversal guards in loadWorkspaceEnv (main-targeted)' (#369 ) from fix/cwe22-loadWorkspaceEnv-main into main Secret scan / Scan diff for credential-shaped strings (push) Successful in 11s Details publish-workspace-server-image / build-and-push (push) Successful in 7m42s Details	2026-05-11 05:12:46 +00:00
core-be	322beb506e	Merge pull request #369 from fix/cwe22-loadWorkspaceEnv-main Secret scan / Scan diff for credential-shaped strings (pull_request) Successful in 11s Details sop-tier-check / tier-check (pull_request) Manual override for infra#241 Details audit-force-merge / audit (pull_request) Successful in 14s Details	2026-05-11 03:59:08 +00:00
core-be	f82033a3ca	[ci force] force fresh runner Secret scan / Scan diff for credential-shaped strings (pull_request) Successful in 15s Details sop-tier-check / tier-check (pull_request) Failing after 9s Details	2026-05-11 03:52:40 +00:00
core-be	fd40700c43	[ci skip false-positive] force re-run CI (runner stuck at infra#241) Secret scan / Scan diff for credential-shaped strings (pull_request) Successful in 6s Details sop-tier-check / tier-check (pull_request) Failing after 6s Details	2026-05-11 03:48:31 +00:00
core-be	706df19b43	[core-be-agent] fix(security#321): CWE-22 path traversal guards in loadWorkspaceEnv Secret scan / Scan diff for credential-shaped strings (pull_request) Successful in 11s Details sop-tier-check / tier-check (pull_request) Failing after 11s Details Two vulnerable call sites confirmed on origin/main: 1. org_helpers.go:loadWorkspaceEnv (line 101): filesDir from untrusted org YAML joined directly with orgBaseDir without traversal guard. A malicious filesDir like "../../../etc" escapes the org root and reads arbitrary files. 2. org_import.go:createWorkspaceTree (line 494): same pattern directly in the env-loading block — not covered by staging-targeted PR #345. Fix (both locations): call resolveInsideRoot(orgBaseDir, filesDir) before filepath.Join. On traversal detection, org_helpers.go returns an empty map (caller contract); org_import.go silently skips the workspace .env override (matches existing template-resolution pattern in the same function). Tests: org_helpers_test.go — 3 cases covering traversal rejection, workspace-override happy path, and empty filesDir edge case. Closes: molecule-core#362, molecule-core#321 Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>	2026-05-11 03:34:55 +00:00
infra-sre	108b9a54d9	Merge pull request '[core-be-agent] fix(#354 ): wire delegation-results consumer into a2a executor' (#358 ) from fix/354-a2a-delegation-auto-resume into main Secret scan / Scan diff for credential-shaped strings (push) Successful in 3s Details publish-runtime-autobump / autobump-and-tag (push) Successful in 31s Details Secret scan / Scan diff for credential-shaped strings (pull_request) Successful in 10s Details sop-tier-check / tier-check (pull_request) Failing after 11s Details audit-force-merge / audit (pull_request) Has been skipped Details	2026-05-11 02:50:41 +00:00
infra-sre	173a642f9e	ci: re-trigger after tier downgrade Secret scan / Scan diff for credential-shaped strings (pull_request) Successful in 2s Details sop-tier-check / tier-check (pull_request) Successful in 3s Details audit-force-merge / audit (pull_request) Successful in 3s Details Co-Authored-By: infra-sre	2026-05-11 02:49:32 +00:00
infra-sre	177c4ef18c	ci: re-trigger after runner recovery Co-Authored-By: infra-sre	2026-05-11 02:49:32 +00:00
core-be	99f3cf7c8f	[core-be-agent] fix(#354 ): wire delegation-results consumer into a2a executor Close the A2A delegation auto-resume gap. Root cause: heartbeat.py's _check_delegations already writes completed delegation rows to DELEGATION_RESULTS_FILE and sends a self-message to wake the agent. executor_helpers.read_delegation_results() was defined to atomically consume that file, but a2a_executor._core_execute() never called it — so delegation results were written but the agent never saw them. Fix: call read_delegation_results() at the top of _core_execute() and prepend the results to the user input context so the agent can act on them without an explicit check_task_status call. The Temporal durable workflow path is also covered because it calls _core_execute() directly. Test: two new cases — delegation results injected when file exists; user input passed through unchanged when file is empty. Closes molecule-core#354.	2026-05-11 02:49:32 +00:00
infra-sre	aed164ed6f	Merge pull request 'fix(workspace): push-mode Queued returns delivery_mode="push" (not silent default "poll")' (#356 ) from runtime/fix-a2a-push-delivery-mode-v2 into main Secret scan / Scan diff for credential-shaped strings (push) Successful in 2s Details publish-runtime-autobump / autobump-and-tag (push) Failing after 29s Details	2026-05-11 02:49:11 +00:00
infra-sre	d616381f81	ci: re-trigger after label change Secret scan / Scan diff for credential-shaped strings (pull_request) Successful in 3s Details sop-tier-check / tier-check (pull_request) Successful in 3s Details audit-force-merge / audit (pull_request) Successful in 3s Details Co-Authored-By: infra-sre	2026-05-11 02:47:21 +00:00
infra-sre	42b867d764	ci: re-trigger after runner recovery Co-Authored-By: infra-sre	2026-05-11 02:47:21 +00:00
infra-runtime-be	3eb3609b0c	test(workspace): add queue_id-absence and push-vs-poll distinction tests Incorporates valuable extra coverage from fullstack-engineer's PR #336: - test_push_queued_missing_queue_id_still_parsed: queue_id is optional, absence must not break parsing - test_push_queued_is_distinct_from_poll_queued: both envelope shapes parse correctly and independently, with correct delivery_mode values Also adds push_queued_no_queue_id fixture and regression gate entry. Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>	2026-05-11 02:47:21 +00:00
infra-runtime-be	0a9b66a3ed	fix(workspace): push-mode Queued returns delivery_mode="push" (not silent default "poll") Bug: a2a_response.py:197 returned Queued(method=method) without passing delivery_mode, silently defaulting to "poll" for push-mode busy-queue responses. Callers branching on v.delivery_mode would mis-identify push-mode responses as poll-mode, causing wrong dispatch logic. Fix: pass delivery_mode="push" explicitly in the push-mode branch. Tests: add push_queued_full/notify/no_method fixtures and 4 test cases asserting delivery_mode="push" for all three envelope shapes. Also add adversarial {"queued": "yes"} and {"queued": False} → Malformed guards. Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>	2026-05-11 02:47:21 +00:00
infra-sre	8046410eee	Merge pull request 'fix(ci): add _sanitize_a2a to TOP_LEVEL_MODULES allowlist (third defect from #351 chain)' (#357 ) from fix/publish-runtime-add-_sanitize_a2a-to-allowlist into main publish-workspace-server-image / build-and-push (push) Failing after 3s Details Secret scan / Scan diff for credential-shaped strings (push) Successful in 3s Details publish-runtime / publish (push) Successful in 2m0s Details publish-runtime / cascade (push) Failing after 52s Details	2026-05-11 02:43:41 +00:00
infra-sre	a1ba496926	ci: re-trigger after runner recovery Secret scan / Scan diff for credential-shaped strings (pull_request) Successful in 4s Details sop-tier-check / tier-check (pull_request) Successful in 4s Details audit-force-merge / audit (pull_request) Successful in 3s Details Co-Authored-By: infra-sre	2026-05-11 02:41:46 +00:00
hongming	ce479e5ced	fix(ci): add _sanitize_a2a to TOP_LEVEL_MODULES allowlist (third workflow defect) sop-tier-check / tier-check (pull_request) Failing after 3s Details Secret scan / Scan diff for credential-shaped strings (pull_request) Successful in 3s Details Run 5160 publish-runtime build step failed: error: TOP_LEVEL_MODULES drifted from workspace/.py contents: in workspace/ but NOT in TOP_LEVEL_MODULES (will ship un-rewritten): ['_sanitize_a2a'] Edit scripts/build_runtime_package.py:TOP_LEVEL_MODULES to match. workspace/_sanitize_a2a.py was added recently but the allowlist in scripts/build_runtime_package.py was not updated. The build script intentionally aborts (exit 3) when it detects the drift, because shipping a module un-rewritten breaks the package's flat-layout import contract. Fix: add '_sanitize_a2a' to the set. Alphabetical order preserved (it sorts before 'a2a_'). Third workflow defect after #353 (workflow_dispatch.inputs parser) and #355 (Publish step working-directory). After this lands, attempt #4 of runtime-v0.1.130 should finally succeed. Refs: #351, #353, #355, #348 Q3	2026-05-10 19:32:58 -07:00
claude-ceo-assistant	d293a32593	fix(ci): add missing working-directory to publish-runtime Publish step (#355 ) Secret scan / Scan diff for credential-shaped strings (push) Successful in 2s Details publish-runtime / publish (push) Failing after 58s Details publish-runtime / cascade (push) Has been skipped Details	2026-05-11 02:30:11 +00:00
infra-sre	1254337f4f	ci: re-trigger after runner recovery Secret scan / Scan diff for credential-shaped strings (pull_request) Successful in 2s Details sop-tier-check / tier-check (pull_request) Successful in 3s Details audit-force-merge / audit (pull_request) Successful in 3s Details Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>	2026-05-11 02:29:51 +00:00
hongming	b026179476	fix(ci): add missing working-directory to publish-runtime Publish step First-ever publish-runtime.yml dispatch (run 5097 post-#353, 2026-05-11 02:06Z) failed at the twine upload step: ERROR InvalidDistribution: Cannot find file (or expand pattern): 'dist/*' Cause: the Publish step was missing 'working-directory: ${{ runner.temp }}/runtime-build' while the preceding Build/Verify steps all had it. Result: twine ran from the workspace checkout dir where dist/ doesn't exist. Fix: add working-directory to match the rest of the publish job. This is the second of three workflow defects exposed by #353 finally making the workflow run at all: 1. workflow_dispatch.inputs rejection → fixed in #353 2. Publish step missing working-directory → THIS PR 3. (anything else surfaced by 0.1.130 attempt #2) After merge: push runtime-v0.1.130 again (tag was already pushed once post-#353 but the run failed at publish; need a fresh trigger). Should finally land 0.1.130 on PyPI. Refs: #351, #348 Q3, #353	2026-05-11 02:29:51 +00:00
infra-sre	64bb7352ca	Merge pull request 'fix(ci): add sqlalchemy>=2.0.0 to pip install step (closes #293 )' (#332 ) from ci/add-sqlalchemy-to-pip-install into main Secret scan / Scan diff for credential-shaped strings (push) Successful in 3s Details	2026-05-11 02:28:08 +00:00
core-devops	1b6c28ebfa	fix(ci): add sqlalchemy>=2.0.0 to pip install step (closes #293 ) Secret scan / Scan diff for credential-shaped strings (pull_request) Successful in 3s Details sop-tier-check / tier-check (pull_request) Successful in 2s Details audit-force-merge / audit (pull_request) Successful in 3s Details test_audit_ledger.py imports sqlalchemy directly (line 42). Without an explicit sqlalchemy install, pip dependency resolution can omit it when pytest/pytest-asyncio/pytest-cov are installed as a separate step after requirements.txt. Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>	2026-05-11 02:26:53 +00:00