test(handlers): add PatchAbilities regression coverage

Adds 11 test cases for PATCH /workspaces/:id/abilities: Happy path: - broadcast_enabled=true → 200 - broadcast_enabled=false → 200 - talk_to_user_enabled=true → 200 - both fields in one request → 200 (each UPDATE in order) Input validation: - empty body {} → 400 - non-JSON body → 400 - non-UUID workspace ID → 400 Database errors: - workspace not found → 404 - DB error on existence check → 500 - DB error on broadcast_enabled UPDATE → 500 - DB error on talk_to_user_enabled UPDATE → 500 Covers workspace_abilities.go which was the only unreviewed handler with zero test coverage. No production code changed. Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>
Merge pull request 'fix(workspace-server): inject /configs token files agent-owned, not root (P0 list_peers 401)' (#1327 ) from fix/workspace-token-injection-agent-owned into main
2026-05-16 14:18:50 +00:00 · 2026-05-16 12:51:57 +00:00 · 2026-05-16 12:05:32 +00:00 · 2026-05-16 10:27:13 +00:00 · 2026-05-16 02:19:11 -07:00
4 changed files with 426 additions and 10 deletions
@@ -177,7 +177,7 @@ func isEnvIdentPart(c byte) bool {
 	return isEnvIdentStart(c) || (c >= '0' && c <= '9')
 }

-// loadWorkspaceEnv reads the org root .env and the workspace-specific .env .env and the workspace-specific .env
+// loadWorkspaceEnv reads the org root .env and the workspace-specific .env
 // (workspace overrides org root). Used by both secret injection and channel
 // config expansion.
 //
@@ -0,0 +1,265 @@
+package handlers
+
+// workspace_abilities_test.go — regression tests for PATCH /workspaces/:id/abilities.
+//
+// The handler toggles two workspace-level ability flags:
+//   broadcast_enabled    — workspace may POST /broadcast to send org-wide messages
+//   talk_to_user_enabled — workspace may deliver canvas chat messages via
+//                          send_message_to_user / POST /notify
+//
+// Gated behind AdminAuth so workspace agents cannot self-modify their own
+// ability flags. These tests cover the uncredentialed unit-path (AdminAuth
+// middleware is tested separately).
+
+import (
+	"bytes"
+	"database/sql"
+	"net/http"
+	"net/http/httptest"
+	"testing"
+
+	"github.com/DATA-DOG/go-sqlmock"
+	"github.com/gin-gonic/gin"
+)
+
+// validUUID is a stable test workspace ID that passes uuid.Parse validation.
+const validUUID = "00000000-0000-0000-0000-000000000001"
+
+// buildAbilitiesCtx returns a recorder and gin test context for a JSON PATCH /workspaces/:id/abilities request.
+func buildAbilitiesCtx(id string, body string) (*httptest.ResponseRecorder, *gin.Context) {
+	rec := httptest.NewRecorder()
+	req := httptest.NewRequest(http.MethodPatch, "/workspaces/"+id+"/abilities", bytes.NewBufferString(body))
+	req.Header.Set("Content-Type", "application/json")
+	ctx, _ := gin.CreateTestContext(rec)
+	ctx.Params = gin.Params{{Key: "id", Value: id}}
+	ctx.Request = req
+	return rec, ctx
+}
+
+// -------- Happy path --------
+
+// Enabling broadcast on an existing workspace expects one UPDATE and a 200.
+func TestPatchAbilities_BroadcastEnabled_200(t *testing.T) {
+	dbMock := setupTestDB(t)
+	setupTestRedis(t)
+
+	existsRow := sqlmock.NewRows([]string{"exists"}).AddRow(true)
+	dbMock.ExpectQuery(`SELECT EXISTS\(SELECT 1 FROM workspaces WHERE id = \$1 AND status != 'removed'\)`).
+		WithArgs(validUUID).WillReturnRows(existsRow)
+	dbMock.ExpectExec(`UPDATE workspaces SET broadcast_enabled = \$2, updated_at = now\(\) WHERE id = \$1`).
+		WithArgs(validUUID, true).WillReturnResult(sqlmock.NewResult(0, 1))
+
+	rec, ctx := buildAbilitiesCtx(validUUID, `{"broadcast_enabled":true}`)
+	PatchAbilities(ctx)
+
+	if got := rec.Code; got != http.StatusOK {
+		t.Errorf("expected 200, got %d: %s", got, rec.Body.String())
+	}
+	// Every queued expectation must have been consumed by the handler.
+	if err := dbMock.ExpectationsWereMet(); err != nil {
+		t.Errorf("unmet sqlmock expectations: %v", err)
+	}
+}
+
+// Disabling broadcast on an existing workspace expects one UPDATE and a 200.
+func TestPatchAbilities_BroadcastEnabledFalse_200(t *testing.T) {
+	dbMock := setupTestDB(t)
+	setupTestRedis(t)
+
+	existsRow := sqlmock.NewRows([]string{"exists"}).AddRow(true)
+	dbMock.ExpectQuery(`SELECT EXISTS\(SELECT 1 FROM workspaces WHERE id = \$1 AND status != 'removed'\)`).
+		WithArgs(validUUID).WillReturnRows(existsRow)
+	dbMock.ExpectExec(`UPDATE workspaces SET broadcast_enabled = \$2, updated_at = now\(\) WHERE id = \$1`).
+		WithArgs(validUUID, false).WillReturnResult(sqlmock.NewResult(0, 1))
+
+	rec, ctx := buildAbilitiesCtx(validUUID, `{"broadcast_enabled":false}`)
+	PatchAbilities(ctx)
+
+	if got := rec.Code; got != http.StatusOK {
+		t.Errorf("expected 200, got %d: %s", got, rec.Body.String())
+	}
+	// Every queued expectation must have been consumed by the handler.
+	if err := dbMock.ExpectationsWereMet(); err != nil {
+		t.Errorf("unmet sqlmock expectations: %v", err)
+	}
+}
+
+// Enabling talk-to-user on an existing workspace expects one UPDATE and a 200.
+func TestPatchAbilities_TalkToUserEnabled_200(t *testing.T) {
+	dbMock := setupTestDB(t)
+	setupTestRedis(t)
+
+	existsRow := sqlmock.NewRows([]string{"exists"}).AddRow(true)
+	dbMock.ExpectQuery(`SELECT EXISTS\(SELECT 1 FROM workspaces WHERE id = \$1 AND status != 'removed'\)`).
+		WithArgs(validUUID).WillReturnRows(existsRow)
+	dbMock.ExpectExec(`UPDATE workspaces SET talk_to_user_enabled = \$2, updated_at = now\(\) WHERE id = \$1`).
+		WithArgs(validUUID, true).WillReturnResult(sqlmock.NewResult(0, 1))
+
+	rec, ctx := buildAbilitiesCtx(validUUID, `{"talk_to_user_enabled":true}`)
+	PatchAbilities(ctx)
+
+	if got := rec.Code; got != http.StatusOK {
+		t.Errorf("expected 200, got %d: %s", got, rec.Body.String())
+	}
+	// Every queued expectation must have been consumed by the handler.
+	if err := dbMock.ExpectationsWereMet(); err != nil {
+		t.Errorf("unmet sqlmock expectations: %v", err)
+	}
+}
+
+// Both ability flags in the same request are each written with their own UPDATE.
+func TestPatchAbilities_BothFields_200(t *testing.T) {
+	mock := setupTestDB(t)
+	setupTestRedis(t)
+
+	mock.ExpectQuery(`SELECT EXISTS\(SELECT 1 FROM workspaces WHERE id = \$1 AND status != 'removed'\)`).
+		WithArgs(validUUID).
+		WillReturnRows(sqlmock.NewRows([]string{"exists"}).AddRow(true))
+	// broadcast_enabled written first
+	mock.ExpectExec(`UPDATE workspaces SET broadcast_enabled = \$2, updated_at = now\(\) WHERE id = \$1`).
+		WithArgs(validUUID, true).
+		WillReturnResult(sqlmock.NewResult(0, 1))
+	// talk_to_user_enabled written second
+	mock.ExpectExec(`UPDATE workspaces SET talk_to_user_enabled = \$2, updated_at = now\(\) WHERE id = \$1`).
+		WithArgs(validUUID, false).
+		WillReturnResult(sqlmock.NewResult(0, 1))
+
+	w, c := buildAbilitiesCtx(validUUID, `{"broadcast_enabled":true,"talk_to_user_enabled":false}`)
+	PatchAbilities(c)
+
+	if w.Code != http.StatusOK {
+		t.Errorf("expected 200, got %d: %s", w.Code, w.Body.String())
+	}
+	if err := mock.ExpectationsWereMet(); err != nil {
+		t.Errorf("unmet sqlmock expectations: %v", err)
+	}
+}
+
+// -------- Input validation --------
+
+// A JSON object that sets neither ability flag must be rejected with 400.
+func TestPatchAbilities_NoAbilityFields_400(t *testing.T) {
+	setupTestDB(t)
+	setupTestRedis(t)
+
+	rec, ctx := buildAbilitiesCtx(validUUID, `{}`)
+	PatchAbilities(ctx)
+
+	if got := rec.Code; got != http.StatusBadRequest {
+		t.Errorf("expected 400, got %d: %s", got, rec.Body.String())
+	}
+}
+
+// A request body that is not valid JSON must be rejected with 400.
+func TestPatchAbilities_InvalidJSON_400(t *testing.T) {
+	setupTestDB(t)
+	setupTestRedis(t)
+
+	rec, ctx := buildAbilitiesCtx(validUUID, `not json at all`)
+	PatchAbilities(ctx)
+
+	if got := rec.Code; got != http.StatusBadRequest {
+		t.Errorf("expected 400, got %d: %s", got, rec.Body.String())
+	}
+}
+
+// A workspace ID path parameter that is not a UUID must be rejected with 400.
+func TestPatchAbilities_InvalidWorkspaceID_400(t *testing.T) {
+	setupTestDB(t)
+	setupTestRedis(t)
+
+	rec, ctx := buildAbilitiesCtx("not-a-uuid", `{"broadcast_enabled":true}`)
+	PatchAbilities(ctx)
+
+	if got := rec.Code; got != http.StatusBadRequest {
+		t.Errorf("expected 400, got %d: %s", got, rec.Body.String())
+	}
+}
+
+// -------- Database errors --------
+
+// When the existence probe reports false, the handler must answer 404.
+func TestPatchAbilities_WorkspaceNotFound_404(t *testing.T) {
+	dbMock := setupTestDB(t)
+	setupTestRedis(t)
+
+	missingRow := sqlmock.NewRows([]string{"exists"}).AddRow(false)
+	dbMock.ExpectQuery(`SELECT EXISTS\(SELECT 1 FROM workspaces WHERE id = \$1 AND status != 'removed'\)`).
+		WithArgs(validUUID).WillReturnRows(missingRow)
+
+	rec, ctx := buildAbilitiesCtx(validUUID, `{"broadcast_enabled":true}`)
+	PatchAbilities(ctx)
+
+	if got := rec.Code; got != http.StatusNotFound {
+		t.Errorf("expected 404, got %d: %s", got, rec.Body.String())
+	}
+	if err := dbMock.ExpectationsWereMet(); err != nil {
+		t.Errorf("unmet sqlmock expectations: %v", err)
+	}
+}
+
+// A database failure during the existence probe must surface as 500.
+func TestPatchAbilities_DBErrorOnExistsCheck_500(t *testing.T) {
+	dbMock := setupTestDB(t)
+	setupTestRedis(t)
+
+	// The mocked existence query fails with sql.ErrConnDone instead of returning a row.
+	dbMock.ExpectQuery(`SELECT EXISTS\(SELECT 1 FROM workspaces WHERE id = \$1 AND status != 'removed'\)`).
+		WithArgs(validUUID).WillReturnError(sql.ErrConnDone)
+
+	rec, ctx := buildAbilitiesCtx(validUUID, `{"broadcast_enabled":true}`)
+	PatchAbilities(ctx)
+
+	if got := rec.Code; got != http.StatusInternalServerError {
+		t.Errorf("expected 500, got %d: %s", got, rec.Body.String())
+	}
+	if err := dbMock.ExpectationsWereMet(); err != nil {
+		t.Errorf("unmet sqlmock expectations: %v", err)
+	}
+}
+
+// A database failure while writing broadcast_enabled must surface as 500.
+func TestPatchAbilities_DBErrorOnBroadcastUpdate_500(t *testing.T) {
+	dbMock := setupTestDB(t)
+	setupTestRedis(t)
+
+	existsRow := sqlmock.NewRows([]string{"exists"}).AddRow(true)
+	dbMock.ExpectQuery(`SELECT EXISTS\(SELECT 1 FROM workspaces WHERE id = \$1 AND status != 'removed'\)`).
+		WithArgs(validUUID).WillReturnRows(existsRow)
+	dbMock.ExpectExec(`UPDATE workspaces SET broadcast_enabled = \$2, updated_at = now\(\) WHERE id = \$1`).
+		WithArgs(validUUID, true).WillReturnError(sql.ErrConnDone)
+
+	rec, ctx := buildAbilitiesCtx(validUUID, `{"broadcast_enabled":true}`)
+	PatchAbilities(ctx)
+
+	if got := rec.Code; got != http.StatusInternalServerError {
+		t.Errorf("expected 500, got %d: %s", got, rec.Body.String())
+	}
+	// The failing UPDATE must still have been attempted by the handler.
+	if err := dbMock.ExpectationsWereMet(); err != nil {
+		t.Errorf("unmet sqlmock expectations: %v", err)
+	}
+}
+
+// A database failure while writing talk_to_user_enabled must surface as 500.
+func TestPatchAbilities_DBErrorOnTalkToUserUpdate_500(t *testing.T) {
+	dbMock := setupTestDB(t)
+	setupTestRedis(t)
+
+	existsRow := sqlmock.NewRows([]string{"exists"}).AddRow(true)
+	dbMock.ExpectQuery(`SELECT EXISTS\(SELECT 1 FROM workspaces WHERE id = \$1 AND status != 'removed'\)`).
+		WithArgs(validUUID).WillReturnRows(existsRow)
+	dbMock.ExpectExec(`UPDATE workspaces SET talk_to_user_enabled = \$2, updated_at = now\(\) WHERE id = \$1`).
+		WithArgs(validUUID, true).WillReturnError(sql.ErrConnDone)
+
+	rec, ctx := buildAbilitiesCtx(validUUID, `{"talk_to_user_enabled":true}`)
+	PatchAbilities(ctx)
+
+	if got := rec.Code; got != http.StatusInternalServerError {
+		t.Errorf("expected 500, got %d: %s", got, rec.Body.String())
+	}
+	// The failing UPDATE must still have been attempted by the handler.
+	if err := dbMock.ExpectationsWereMet(); err != nil {
+		t.Errorf("unmet sqlmock expectations: %v", err)
+	}
+}
@@ -189,6 +189,24 @@ const containerNamePrefix = "ws-"
 // (the wiped-DB case after `docker compose down -v`).
 const LabelManaged = "molecule.platform.managed"

+// AgentUID / AgentGID are the uid/gid of the unprivileged `agent` user that
+// every workspace template creates and drops to via `gosu agent` before
+// exec'ing the runtime (the a2a_mcp_server runs under this uid). The value is
+// fixed at 1000:1000 across all templates — see:
+//   - workspace-configs-templates/claude-code-default/Dockerfile (`useradd -u 1000 ... agent`)
+//   - workspace-configs-templates/hermes/Dockerfile               (`useradd -u 1000 ... agent`)
+//   - workspace/entrypoint.sh                                     (`exec gosu agent` — "uid 1000")
+//
+// Files the platform injects into /configs AFTER the entrypoint's
+// `chown -R agent:agent /configs` (the post-start #418 re-injection and the
+// pre-start #1877 volume write) must be owned by this uid/gid, otherwise the
+// agent-uid MCP server hits EACCES reading /configs/.auth_token, sends an
+// empty bearer, and the platform 401s on /registry/{id}/peers (list_peers).
+const (
+	AgentUID = 1000
+	AgentGID = 1000
+)
+
 // managedLabels is the canonical label map applied to every workspace
 // container + volume. Pulled out so a future addition (e.g. instance
 // UUID for multi-platform-shared-daemon disambiguation) is one edit.
@@ -862,8 +880,18 @@ func buildTemplateTar(templatePath string) (*bytes.Buffer, error) {
 	return &buf, nil
 }

-// WriteFilesToContainer writes in-memory files into /configs in the container.
-func (p *Provisioner) WriteFilesToContainer(ctx context.Context, containerID string, files map[string][]byte) error {
+// buildConfigFilesTar builds the tar stream that WriteFilesToContainer streams
+// into /configs via CopyToContainer. Every entry is stamped Uid/Gid = agent
+// (AgentUID/AgentGID) so the files land agent-owned after extraction. This is
+// the issue #418 post-start re-injection path: it runs AFTER the template
+// entrypoint's `chown -R agent:agent /configs`, so without explicit ownership
+// in the tar header the files extract as root:root (tar Uid/Gid default 0) and
+// the agent-uid MCP server can no longer read /configs/.auth_token (and
+// /configs/.platform_inbound_secret) → empty bearer → list_peers 401.
+//
+// Pulled out as a pure function so the ownership contract is unit-testable
+// without a live Docker daemon (mirrors buildTemplateTar).
+func buildConfigFilesTar(files map[string][]byte) (*bytes.Buffer, error) {
 	var buf bytes.Buffer
 	tw := tar.NewWriter(&buf)

@@ -876,8 +904,10 @@ func (p *Provisioner) WriteFilesToContainer(ctx context.Context, containerID str
 				Typeflag: tar.TypeDir,
 				Name:     dir + "/",
 				Mode:     0755,
+				Uid:      AgentUID,
+				Gid:      AgentGID,
 			}); err != nil {
-				return fmt.Errorf("failed to write tar dir header for %s: %w", dir, err)
+				return nil, fmt.Errorf("failed to write tar dir header for %s: %w", dir, err)
 			}
 			createdDirs[dir] = true
 		}
@@ -886,19 +916,30 @@ func (p *Provisioner) WriteFilesToContainer(ctx context.Context, containerID str
 			Name: name,
 			Mode: 0644,
 			Size: int64(len(data)),
+			Uid:  AgentUID,
+			Gid:  AgentGID,
 		}
 		if err := tw.WriteHeader(header); err != nil {
-			return fmt.Errorf("failed to write tar header for %s: %w", name, err)
+			return nil, fmt.Errorf("failed to write tar header for %s: %w", name, err)
 		}
 		if _, err := tw.Write(data); err != nil {
-			return fmt.Errorf("failed to write tar data for %s: %w", name, err)
+			return nil, fmt.Errorf("failed to write tar data for %s: %w", name, err)
 		}
 	}
 	if err := tw.Close(); err != nil {
-		return fmt.Errorf("failed to close tar writer: %w", err)
+		return nil, fmt.Errorf("failed to close tar writer: %w", err)
 	}
+	return &buf, nil
+}

-	return p.cli.CopyToContainer(ctx, containerID, "/configs", &buf, container.CopyToContainerOptions{})
+// WriteFilesToContainer packs files into a tar via buildConfigFilesTar and
+// copies that archive into the container's /configs directory.
+func (p *Provisioner) WriteFilesToContainer(ctx context.Context, containerID string, files map[string][]byte) error {
+	archive, buildErr := buildConfigFilesTar(files)
+	if buildErr != nil {
+		return buildErr
+	}
+	return p.cli.CopyToContainer(ctx, containerID, "/configs", archive, container.CopyToContainerOptions{})
 }

 // CopyToContainer exposes CopyToContainer from the Docker client for use by other packages.
@@ -988,13 +1029,28 @@ func (p *Provisioner) ReadFromVolume(ctx context.Context, volumeName, filePath s
 	return clean, nil
 }

+// writeAuthTokenVolumeCmd returns the shell command the throwaway alpine
+// container runs to seed /vol/.auth_token. The command runs as root, so it
+// ends with an explicit chown to AgentUID:AgentGID; otherwise the agent-uid MCP
+// server gets EACCES reading the token → empty bearer → list_peers 401.
+// "$TOKEN" is double-quoted so the shell writes the value verbatim instead of
+// word-splitting or glob-expanding it. Kept as a pure function so the command
+// is unit-testable without a live Docker daemon. Issue #1877.
+func writeAuthTokenVolumeCmd() string {
+	return fmt.Sprintf(
+		"mkdir -p /vol && printf '%%s' \"$TOKEN\" > /vol/.auth_token && chmod 0600 /vol/.auth_token && chown %d:%d /vol/.auth_token",
+		AgentUID, AgentGID,
+	)
+}
+
 // WriteAuthTokenToVolume writes the workspace auth token into the config volume
 // BEFORE the container starts, eliminating the token-injection race window where
 // a restarted container could read a stale token from /configs/.auth_token before
 // WriteFilesToContainer writes the new one. Issue #1877.
 //
 // Uses a throwaway alpine container to write directly to the named volume,
-// bypassing the container lifecycle entirely.
+// bypassing the container lifecycle entirely. The written file is chowned to
+// the agent uid/gid (see writeAuthTokenVolumeCmd).
 func (p *Provisioner) WriteAuthTokenToVolume(ctx context.Context, workspaceID, token string) error {
 	if p == nil || p.cli == nil {
 		return ErrNoBackend
@@ -1002,7 +1058,7 @@ func (p *Provisioner) WriteAuthTokenToVolume(ctx context.Context, workspaceID, t
 	volName := ConfigVolumeName(workspaceID)
 	resp, err := p.cli.ContainerCreate(ctx, &container.Config{
 		Image: "alpine",
-		Cmd:   []string{"sh", "-c", "mkdir -p /vol && printf '%s' $TOKEN > /vol/.auth_token && chmod 0600 /vol/.auth_token"},
+		Cmd:   []string{"sh", "-c", writeAuthTokenVolumeCmd()},
 		Env:   []string{"TOKEN=" + token},
 	}, &container.HostConfig{
 		Binds: []string{volName + ":/vol"},
@@ -0,0 +1,95 @@
+package provisioner
+
+import (
+	"archive/tar"
+	"errors"
+	"io"
+	"strings"
+	"testing"
+)
+
+// These tests pin the P0 fix for the fleet-wide list_peers 401 (Hermes and
+// every other template): the workspace-server token-injection paths wrote
+// /configs/.auth_token (and /configs/.platform_inbound_secret) as root:root
+// AFTER the template entrypoint's `chown -R agent:agent /configs` ran, so the
+// agent-uid (1000) MCP server (a2a_mcp_server, running via `gosu agent`) hit
+// `[Errno 13] Permission denied` reading the bearer → empty bearer → platform
+// 401 on /registry/{id}/peers (the literal tool_list_peers path).
+//
+// The agent uid is 1000:1000, verified from the templates:
+//   - workspace-configs-templates/claude-code-default/Dockerfile: `useradd -u 1000 ... agent`
+//   - workspace-configs-templates/hermes/Dockerfile:               `useradd -u 1000 ... agent`
+//   - workspace/entrypoint.sh / claude-code-default/entrypoint.sh:  `exec gosu agent` ("uid 1000")
+//
+// Both tests assert the real artifact (the tar headers Docker's CopyToContainer
+// honours for ownership, and the literal shell command the throwaway alpine
+// container runs), not a mock that bypasses ownership. They FAIL on pre-fix
+// code (no Uid/Gid in tar headers; no chown in the alpine command → root:root)
+// and PASS post-fix (agent-owned).
+
+// TestWriteFilesToContainerTar_FilesAreAgentOwned pins the issue #418
+// post-start re-injection path (WriteFilesToContainer). It builds the tar that
+// would be streamed into /configs and requires every entry header to carry
+// Uid/Gid = AgentUID/AgentGID, so extracted files are agent-owned rather than
+// root:root. It also requires that .auth_token and .platform_inbound_secret
+// are both present in the archive.
+func TestWriteFilesToContainerTar_FilesAreAgentOwned(t *testing.T) {
+	input := map[string][]byte{
+		".auth_token":              []byte("tok-abc123"),
+		".platform_inbound_secret": []byte("inbound-secret-xyz"),
+		"nested/dir/file.txt":      []byte("data"),
+	}
+
+	archive, err := buildConfigFilesTar(input)
+	if err != nil {
+		t.Fatalf("buildConfigFilesTar: %v", err)
+	}
+
+	// Walk every entry in the archive and check its ownership fields.
+	names := make(map[string]bool)
+	reader := tar.NewReader(archive)
+	for entry, nextErr := reader.Next(); !errors.Is(nextErr, io.EOF); entry, nextErr = reader.Next() {
+		if nextErr != nil {
+			t.Fatalf("read tar: %v", nextErr)
+		}
+		if _, copyErr := io.Copy(io.Discard, reader); copyErr != nil {
+			t.Fatalf("drain %s: %v", entry.Name, copyErr)
+		}
+		names[entry.Name] = true
+		if entry.Uid != AgentUID {
+			t.Fatalf("tar entry %q Uid = %d, want %d (agent) — root-owned injection causes the list_peers 401",
+				entry.Name, entry.Uid, AgentUID)
+		}
+		if entry.Gid != AgentGID {
+			t.Fatalf("tar entry %q Gid = %d, want %d (agent)",
+				entry.Name, entry.Gid, AgentGID)
+		}
+	}
+
+	// Both credential files must actually be present in the archive.
+	for _, required := range []string{".auth_token", ".platform_inbound_secret"} {
+		if !names[required] {
+			t.Fatalf("tar missing %q (seen: %v)", required, names)
+		}
+	}
+}
+
+// TestWriteAuthTokenVolumeCmd_ChownsToAgent covers the issue #1877 pre-start
+// volume-write path (WriteAuthTokenToVolume): the throwaway alpine container
+// writes /vol/.auth_token then chmod 0600 but, pre-fix, never chowns it, so it
+// stays root:root (alpine runs the command as root). The literal command must
+// chown the file to the agent uid:gid so the agent-uid MCP server can read it.
+func TestWriteAuthTokenVolumeCmd_ChownsToAgent(t *testing.T) {
+	cmd := writeAuthTokenVolumeCmd()
+
+	if !strings.Contains(cmd, "chmod 0600 /vol/.auth_token") {
+		t.Fatalf("alpine cmd lost the 0600 chmod (regression): %q", cmd)
+	}
+
+	wantChown := "chown 1000:1000 /vol/.auth_token"
+	if !strings.Contains(cmd, wantChown) {
+		t.Fatalf("alpine cmd = %q, missing %q — without it .auth_token stays root:root "+
+			"and the agent-uid MCP server gets EACCES → empty bearer → list_peers 401",
+			cmd, wantChown)
+	}
+}
Author	SHA1	Message	Date
core-be	bce4844b70	test(handlers): add PatchAbilities regression coverage Block internal-flavored paths / Block forbidden paths (pull_request) Successful in 24s Details CI / Detect changes (pull_request) Successful in 23s Details CI / Shellcheck (E2E scripts) (pull_request) Successful in 24s Details E2E API Smoke Test / detect-changes (pull_request) Successful in 29s Details E2E Chat / detect-changes (pull_request) Successful in 32s Details E2E Staging Canvas (Playwright) / detect-changes (pull_request) Successful in 31s Details Handlers Postgres Integration / detect-changes (pull_request) Successful in 22s Details Harness Replays / detect-changes (pull_request) Successful in 20s Details Secret scan / Scan diff for credential-shaped strings (pull_request) Successful in 25s Details qa-review / approved (pull_request) Failing after 32s Details Runtime PR-Built Compatibility / detect-changes (pull_request) Successful in 38s Details security-review / approved (pull_request) Failing after 28s Details gate-check-v3 / gate-check (pull_request) Successful in 40s Details sop-checklist / all-items-acked (pull_request) Successful in 34s Details sop-tier-check / tier-check (pull_request) Successful in 28s Details lint-required-no-paths / lint-required-no-paths (pull_request) Successful in 1m44s Details CI / Python Lint & Test (pull_request) Successful in 8m12s Details E2E Staging Canvas (Playwright) / Canvas tabs E2E (pull_request) Successful in 15s Details Harness Replays / Harness Replays (pull_request) Successful in 12s Details Runtime PR-Built Compatibility / PR-built wheel + import smoke (pull_request) Successful in 14s Details CI / Canvas (Next.js) (pull_request) Failing after 18m21s Details CI / Canvas Deploy Reminder (pull_request) Has been skipped Details E2E API Smoke Test / E2E API Smoke Test (pull_request) Failing after 3m53s Details CI / all-required (pull_request) Failing after 18m12s Details Handlers Postgres Integration / Handlers Postgres Integration 
(pull_request) Failing after 4m3s Details E2E Chat / E2E Chat (pull_request) Failing after 4m12s Details CI / Platform (Go) (pull_request) Failing after 23m10s Details Adds 11 test cases for PATCH /workspaces/:id/abilities: Happy path: - broadcast_enabled=true → 200 - broadcast_enabled=false → 200 - talk_to_user_enabled=true → 200 - both fields in one request → 200 (each UPDATE in order) Input validation: - empty body {} → 400 - non-JSON body → 400 - non-UUID workspace ID → 400 Database errors: - workspace not found → 404 - DB error on existence check → 500 - DB error on broadcast_enabled UPDATE → 500 - DB error on talk_to_user_enabled UPDATE → 500 Covers workspace_abilities.go which was the only unreviewed handler with zero test coverage. No production code changed. Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>	2026-05-16 14:18:50 +00:00
devops-engineer	8e754e6b28	Merge pull request 'fix(workspace-server): inject /configs token files agent-owned, not root (P0 list_peers 401)' (#1327 ) from fix/workspace-token-injection-agent-owned into main Block internal-flavored paths / Block forbidden paths (push) Successful in 15s Details CI / Detect changes (push) Successful in 31s Details CI / Shellcheck (E2E scripts) (push) Successful in 39s Details E2E API Smoke Test / detect-changes (push) Successful in 31s Details E2E Chat / detect-changes (push) Successful in 24s Details E2E Staging Canvas (Playwright) / detect-changes (push) Successful in 25s Details E2E Staging SaaS (full lifecycle) / pr-validate (push) Successful in 59s Details Handlers Postgres Integration / detect-changes (push) Successful in 16s Details Harness Replays / detect-changes (push) Successful in 16s Details Runtime PR-Built Compatibility / detect-changes (push) Successful in 32s Details Secret scan / Scan diff for credential-shaped strings (push) Successful in 27s Details CI / Python Lint & Test (push) Successful in 8m25s Details E2E Staging SaaS (full lifecycle) / E2E Staging SaaS (push) Successful in 6m53s Details publish-workspace-server-image / build-and-push (push) Successful in 14m43s Details CI / Canvas (Next.js) (push) Successful in 23m23s Details CI / Platform (Go) (push) Successful in 26m50s Details CI / all-required (push) Successful in 26m43s Details Runtime Pin Compatibility / PyPI-latest install + import smoke (push) Successful in 3m22s Details E2E API Smoke Test / E2E API Smoke Test (push) Failing after 7m6s Details E2E Staging Canvas (Playwright) / Canvas tabs E2E (push) Successful in 27s Details E2E Chat / E2E Chat (push) Failing after 12m54s Details Harness Replays / Harness Replays (push) Successful in 9s Details Runtime PR-Built Compatibility / PR-built wheel + import smoke (push) Successful in 3m3s Details Handlers Postgres Integration / Handlers Postgres Integration (push) Successful in 7m4s Details 
lint-continue-on-error-tracking / lint-continue-on-error-tracking (push) Successful in 2m12s Details CI / Canvas Deploy Reminder (push) Successful in 9s Details publish-workspace-server-image / Production auto-deploy (push) Successful in 2m22s Details main-red-watchdog / watchdog (push) Successful in 49s Details Railway pin audit (drift detection) / Audit Railway env vars for drift-prone pins (push) Compensated by status-reaper (workflow has no push: trigger; Gitea 1.22.6 hardcoded-suffix bug — see .gitea/scripts/status-reaper.py) Details gate-check-v3 / gate-check (push) Successful in 50s Details Sweep stale Cloudflare DNS records / Sweep CF orphans (push) Successful in 23s Details ci-required-drift / drift (push) Successful in 1m27s Details Staging SaaS smoke (every 30 min) / Staging SaaS smoke (push) Successful in 4m45s Details Continuous synthetic E2E (staging) / Synthetic E2E against staging (push) Successful in 5m31s Details Sweep stale e2e-* orgs (staging) / Sweep e2e orgs (push) Successful in 16s Details status-reaper / reap (push) Has started running Details gitea-merge-queue / queue (push) Has started running Details Sweep stale Cloudflare Tunnels / Sweep CF tunnels (push) Successful in 32s Details	2026-05-16 12:51:57 +00:00
devops-engineer	8179ff77e9	Merge branch 'main' into fix/workspace-token-injection-agent-owned Block internal-flavored paths / Block forbidden paths (pull_request) Successful in 16s Details CI / Detect changes (pull_request) Successful in 27s Details CI / Shellcheck (E2E scripts) (pull_request) Successful in 43s Details E2E API Smoke Test / detect-changes (pull_request) Successful in 58s Details E2E Chat / detect-changes (pull_request) Successful in 59s Details E2E Staging SaaS (full lifecycle) / E2E Staging SaaS (pull_request) Has been skipped Details E2E Staging Canvas (Playwright) / detect-changes (pull_request) Successful in 1m0s Details Handlers Postgres Integration / detect-changes (pull_request) Successful in 24s Details Harness Replays / detect-changes (pull_request) Successful in 26s Details E2E Staging SaaS (full lifecycle) / pr-validate (pull_request) Successful in 1m8s Details Secret scan / Scan diff for credential-shaped strings (pull_request) Successful in 24s Details Runtime PR-Built Compatibility / detect-changes (pull_request) Successful in 29s Details qa-review / approved (pull_request) Failing after 27s Details gate-check-v3 / gate-check (pull_request) Successful in 39s Details security-review / approved (pull_request) Failing after 27s Details sop-checklist / all-items-acked (pull_request) Successful in 19s Details sop-tier-check / tier-check (pull_request) Successful in 22s Details E2E Staging Canvas (Playwright) / Canvas tabs E2E (pull_request) Successful in 11s Details lint-required-no-paths / lint-required-no-paths (pull_request) Successful in 1m39s Details Harness Replays / Harness Replays (pull_request) Successful in 10s Details Runtime PR-Built Compatibility / PR-built wheel + import smoke (pull_request) Successful in 18s Details E2E API Smoke Test / E2E API Smoke Test (pull_request) Successful in 2m9s Details CI / Python Lint & Test (pull_request) Successful in 7m58s Details Handlers Postgres Integration / Handlers Postgres Integration 
(pull_request) Successful in 6m41s Details E2E Chat / E2E Chat (pull_request) Failing after 8m24s Details CI / Platform (Go) (pull_request) Successful in 16m7s Details CI / Canvas (Next.js) (pull_request) Successful in 16m52s Details CI / all-required (pull_request) Successful in 30m58s Details CI / Canvas Deploy Reminder (pull_request) Has been skipped Details audit-force-merge / audit (pull_request) Successful in 14s Details	2026-05-16 12:05:32 +00:00
infra-runtime-be	6188c6ddf3	fix(org_helpers): correct duplicate phrase in loadWorkspaceEnv comment Runtime PR-Built Compatibility / PR-built wheel + import smoke (pull_request) Blocked by required conditions Details sop-checklist / na-declarations (pull_request) N/A: (none) Details gate-check-v3 / gate-check (pull_request) Waiting to run Details audit-force-merge / audit (pull_request) Has been skipped Details Block internal-flavored paths / Block forbidden paths (pull_request) Successful in 19s Details CI / Detect changes (pull_request) Successful in 19s Details CI / Shellcheck (E2E scripts) (pull_request) Successful in 25s Details E2E API Smoke Test / detect-changes (pull_request) Successful in 34s Details E2E Peer Visibility (literal MCP list_peers) / E2E Peer Visibility (pull_request) Successful in 21s Details E2E Staging SaaS (full lifecycle) / E2E Staging SaaS (pull_request) Has been skipped Details E2E Staging Canvas (Playwright) / detect-changes (pull_request) Successful in 37s Details Handlers Postgres Integration / detect-changes (pull_request) Successful in 23s Details Harness Replays / detect-changes (pull_request) Successful in 22s Details E2E Staging SaaS (full lifecycle) / pr-validate (pull_request) Successful in 1m0s Details Lint curl status-code capture / Scan workflows for curl status-capture pollution (pull_request) Successful in 24s Details lint-required-no-paths / lint-required-no-paths (pull_request) Successful in 1m32s Details Lint pre-flip continue-on-error / Verify continue-on-error flips have run-log proof (pull_request) Successful in 1m59s Details lint-mask-pr-atomicity / lint-mask-pr-atomicity (pull_request) Successful in 2m23s Details publish-runtime-autobump / bump-and-tag (pull_request) Has been skipped Details lint-required-context-exists-in-bp / lint-required-context-exists-in-bp (pull_request) Successful in 2m16s Details Lint workflow YAML (Gitea-1.22.6-hostile shapes) / Lint workflow YAML for Gitea-1.22.6-hostile shapes 
(pull_request) Successful in 1m58s Details lint-continue-on-error-tracking / lint-continue-on-error-tracking (pull_request) Successful in 3m23s Details publish-runtime-autobump / pr-validate (pull_request) Successful in 1m0s Details Runtime PR-Built Compatibility / detect-changes (pull_request) Successful in 38s Details Secret scan / Scan diff for credential-shaped strings (pull_request) Successful in 25s Details CI / Python Lint & Test (pull_request) Successful in 7m22s Details qa-review / approved (pull_request) Failing after 31s Details E2E Staging External Runtime / E2E Staging External Runtime (pull_request) Successful in 5m26s Details sop-checklist / all-items-acked (pull_request) Successful in 26s Details security-review / approved (pull_request) Failing after 34s Details sop-tier-check / tier-check (pull_request) Successful in 32s Details Ops Scripts Tests / Ops scripts (unittest) (pull_request) Failing after 1m30s Details E2E API Smoke Test / E2E API Smoke Test (pull_request) Successful in 6m56s Details CI / Canvas (Next.js) (pull_request) Successful in 19m13s Details CI / Canvas Deploy Reminder (pull_request) Successful in 12s Details CI / Platform (Go) (pull_request) Successful in 20m10s Details Handlers Postgres Integration / Handlers Postgres Integration (pull_request) Successful in 8m2s Details CI / all-required (pull_request) Successful in 20m5s Details Harness Replays / Harness Replays (pull_request) Has been cancelled Details E2E Staging Canvas (Playwright) / Canvas tabs E2E (pull_request) Has been cancelled Details The comment had the phrase "the workspace-specific .env" duplicated. Removed the redundant repetition. Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>	2026-05-16 10:27:13 +00:00
core-be	f986444dbd	fix(workspace-server): inject /configs token files agent-owned, not root Block internal-flavored paths / Block forbidden paths (pull_request) Failing after 0s Details CI / Platform (Go) (pull_request) Failing after 0s Details CI / Detect changes (pull_request) Failing after 0s Details CI / Shellcheck (E2E scripts) (pull_request) Failing after 0s Details CI / Python Lint & Test (pull_request) Failing after 0s Details CI / all-required (pull_request) Failing after 1s Details CI / Canvas Deploy Reminder (pull_request) Has been skipped Details E2E API Smoke Test / detect-changes (pull_request) Failing after 0s Details CI / Canvas (Next.js) (pull_request) Failing after 1s Details E2E Staging Canvas (Playwright) / detect-changes (pull_request) Failing after 1s Details E2E API Smoke Test / E2E API Smoke Test (pull_request) Has been skipped Details E2E Staging Canvas (Playwright) / Canvas tabs E2E (pull_request) Has been skipped Details E2E Staging SaaS (full lifecycle) / pr-validate (pull_request) Failing after 0s Details E2E Staging SaaS (full lifecycle) / E2E Staging SaaS (pull_request) Has been skipped Details Handlers Postgres Integration / detect-changes (pull_request) Failing after 0s Details Handlers Postgres Integration / Handlers Postgres Integration (pull_request) Has been skipped Details Harness Replays / detect-changes (pull_request) Failing after 0s Details Harness Replays / Harness Replays (pull_request) Has been skipped Details lint-required-no-paths / lint-required-no-paths (pull_request) Failing after 0s Details Runtime PR-Built Compatibility / detect-changes (pull_request) Failing after 0s Details Runtime PR-Built Compatibility / PR-built wheel + import smoke (pull_request) Has been skipped Details Secret scan / Scan diff for credential-shaped strings (pull_request) Failing after 0s Details qa-review / approved (pull_request) Failing after 0s Details security-review / approved (pull_request) Failing after 0s Details gate-check-v3 / 
gate-check (pull_request) Failing after 21s Details sop-tier-check / tier-check (pull_request) Successful in 21s Details lint-mask-pr-atomicity / lint-mask-pr-atomicity (pull_request) Successful in 1m21s Details sop-checklist / all-items-acked (pull_request) acked: 0/7 — missing: comprehensive-testing, local-postgres-e2e, staging-smoke, +4 Details sop-checklist / na-declarations (pull_request) N/A: (none) Details The fleet-wide list_peers 401 (Hermes et al): two workspace-server token-injection paths wrote /configs/.auth_token (and /configs/.platform_inbound_secret) as root:root 0600 AFTER the template entrypoint's `chown -R agent:agent /configs` ran. The a2a_mcp_server runs as the agent uid (1000, via `gosu agent`), so platform_auth.get_token() hit `[Errno 13] Permission denied` → empty bearer → platform 401 on /registry/{id}/peers (the literal tool_list_peers path). PR#23 fixed only the entrypoint dir chown (first boot); it cannot reach the post-entrypoint root re-injection. This covers both injection paths: 1. WriteAuthTokenToVolume (#1877, pre-start): the throwaway alpine container ran chmod 0600 but never chowned — alpine runs as root, so the file stayed root:root. Now `chown 1000:1000 /vol/.auth_token` (0600 preserved). 2. WriteFilesToContainer (#418, post-start re-injection): the tar headers left Uid/Gid unset → CopyToContainer extracted root:root. Now every tar entry is stamped Uid/Gid = agent. This path (re)writes BOTH .auth_token and .platform_inbound_secret, so both are fixed. uid 1000:1000 verified from the templates (claude-code-default + hermes Dockerfile `useradd -u 1000 ... agent`, entrypoint `gosu agent`), exposed as AgentUID/AgentGID constants. Tar-build and alpine-cmd extracted into pure helpers (mirrors buildTemplateTar) so the ownership contract is unit-tested without a live Docker daemon; the test fails on pre-fix root:root and passes post-fix (real tar / real command, not a mock). 
PR#23's entrypoint chown is unchanged (still correct for the dir + first boot). No feature flag, no backwards-compat shim. Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>	2026-05-16 02:19:11 -07:00