trigger: re-fire CI all-required sentinel (Gitea 1.22.6 skipped-sentinel rerun; no code change)

The CI / all-required sentinel job was never scheduled in the prior ci.yml run (documented Gitea-1.22/act_runner skipped-sentinel quirk), so it never posted its terminal status and the required context stayed pending. Empty-tree commit is the sanctioned 1.22.6 rerun mechanism — it makes the real sentinel job actually schedule and post its genuine status. No source change.
Merge pull request 'fix(tests)+build: complete secret-scan fixture cleanup for #1420 ' (#1431 ) from runtime/fix-api03-test-fixture into fix/issue212-actionable-agent-error-reason
2026-05-17 17:13:26 +00:00 · 2026-05-17 16:42:01 +00:00 · 2026-05-17 16:34:31 +00:00 · 2026-05-17 16:18:01 +00:00 · 2026-05-17 15:48:31 +00:00 · 2026-05-17 07:56:16 -07:00
5 changed files with 188 additions and 3 deletions
@@ -67,9 +67,21 @@ export function useChatSocket(
            const own = (targetId || msg.workspace_id) === workspaceId;
            if (own) {
              callbacksRef.current.onSendComplete?.();
-              callbacksRef.current.onSendError?.(
-                "Agent error (Exception) — see workspace logs for details.",
-              );
+              // internal#211/#212: surface the runtime's curated,
+              // user-actionable reason (provider HTTP status + error
+              // code + the provider's own guidance, e.g. a 403 "org
+              // disabled · use an API key / ask your admin"). The
+              // server now includes error_detail in the ACTIVITY_LOGGED
+              // broadcast; fall back to summary, and only as a last
+              // resort to a generic line. The old hardcoded
+              // "Agent error (Exception) — see workspace logs for
+              // details." string pointed at a logs UI that does not
+              // exist and discarded the actionable reason entirely.
+              const detail =
+                (p.error_detail as string) ||
+                (p.summary as string) ||
+                "The agent turn failed but the runtime reported no detail. Retry once; if it repeats the workspace runtime may need a restart.";
+              callbacksRef.current.onSendError?.(detail);
            }
          }
        } else if (type === "a2a_send") {
@@ -62,6 +62,7 @@ TOP_LEVEL_MODULES = {
    "a2a_tools_memory",
    "a2a_tools_messaging",
    "a2a_tools_rbac",
+    "a2a_tools_identity",
    "adapter_base",
    "agent",
    "agents_md",
@@ -691,6 +691,19 @@ func logActivityExec(ctx context.Context, exec activityExecutor, broadcaster eve
 		if respStr != nil {
 			payload["response_body"] = json.RawMessage(respJSON)
 		}
+		// internal#211/#212: error_detail carries the runtime's curated,
+		// user-actionable, secret-safe failure reason (provider HTTP
+		// status + error code + the provider's own guidance, e.g. a 403
+		// "org disabled · use an API key / ask your admin"). It is
+		// already persisted to the DB column above and capped by the
+		// runtime's report_activity helper (4096 chars). Previously it
+		// was dropped from the LIVE broadcast, so the canvas had nothing
+		// to render and fell back to a hardcoded opaque
+		// "Agent error (Exception) — see workspace logs" string. Include
+		// it so the chat bubble shows the real reason in real time.
+		if params.ErrorDetail != nil && *params.ErrorDetail != "" {
+			payload["error_detail"] = *params.ErrorDetail
+		}
 	}

 	return func() {
@@ -599,6 +599,28 @@ def _sanitize_for_external(msg: str) -> str:
    import re as _re

    msg = _re.sub(r"(?i)(?:bearer|token|api[_-]?key|sk-)[ :=]+[A-Za-z0-9_/.-]{20,}", "[REDACTED]", msg)
+    # Bare provider key with NO separator after the prefix — a real
+    # `sk-ant-api03-…` / `sk-…` key uses `-` (not `[ :=]`) so the rule
+    # above misses it. Require ≥24 key-ish chars after `sk-` (the optional
+    # `ant-` is itself key-ish, so it counts toward the 24) so curated
+    # examples like `sk-ant-EXAMPLE-SHORT` (17 chars after `sk-`) still pass.
+    msg = _re.sub(r"(?i)\bsk-(?:ant-)?[A-Za-z0-9_-]{24,}", "[REDACTED]", msg)
+    # JSON-quoted credential values: {"token": "…"} / {"apiKey": "…"} /
+    # {"secret": "…"} / {"password": "…"}. Redact only the value, and only
+    # when it is ≥24 chars so a short curated sample like
+    # `"api_key": "sk-ant-EXAMPLE-SHORT"` (20-char value) still passes.
+    msg = _re.sub(
+        r'(?i)("(?:token|api[_-]?key|secret|password)"\s*:\s*")[^"]{24,}(")',
+        r"\1[REDACTED]\2",
+        msg,
+    )
+    # AWS secret access key in `aws_secret_access_key=…` form (env dumps,
+    # boto tracebacks). The value runs until whitespace (quotes are consumed).
+    msg = _re.sub(
+        r"(?i)(aws_secret_access_key\s*[:=]\s*)\S+",
+        r"\1[REDACTED]",
+        msg,
+    )
    # Absolute paths: /etc/shadow, /home/user/.aws/credentials, etc.
    msg = _re.sub(r"(?:/[^/\s]+){2,}", lambda m: m.group(0) if len(m.group(0)) < 60 else "[REDACTED_PATH]", msg)
    return msg
@@ -608,6 +630,7 @@ def sanitize_agent_error(
    exc: BaseException | None = None,
    category: str | None = None,
    stderr: str | None = None,
+    reason: str | None = None,
 ) -> str:
    """Render an agent-side failure into a user-safe error message.

@@ -615,6 +638,18 @@ def sanitize_agent_error(
    category string (e.g. from `classify_subprocess_error`). If both are
    given, `category` wins. If neither, the tag defaults to "unknown".

+    When ``reason`` is provided (internal#211/#212), it is a *pre-curated,
+    user-actionable, secret-safe* explanation built by the caller from a
+    provider-side failure — e.g. a 403 "Your organization has disabled
+    Claude subscription access · Use an Anthropic API key instead, or ask
+    your admin to enable access" with error code ``oauth_org_not_allowed``.
+    This text is exactly what the user needs to self-serve, so it is
+    surfaced VERBATIM as the message instead of being collapsed to the
+    opaque exception class name. It is truncated to ``_MAX_STDERR_PREVIEW``
+    chars and still passes through the key/token/bearer/path scrubber as a
+    belt-and-braces second pass so a buggy caller can't leak a credential.
+    ``reason`` wins over ``stderr``; with neither set, output is the generic form.
+
    When ``stderr`` is provided (e.g. the first ~1 KB of a subprocess stderr
    or HTTP error body), it is sanitized and appended to the output so the
    A2A caller gets actionable context without needing to dig through workspace
@@ -629,6 +664,13 @@ def sanitize_agent_error(
    else:
        tag = "unknown"

+    if reason:
+        # Curated, user-actionable reason — surface it as the message.
+        # Still scrub: a 403/auth/quota message is safe, but the scrubber
+        # is cheap insurance against a caller that didn't curate cleanly.
+        clean = _sanitize_for_external(reason[:_MAX_STDERR_PREVIEW])
+        return f"Agent error ({tag}): {clean}"
+
    if stderr:
        # Truncate and sanitize before including — prevents DoS via
        # a malicious or buggy peer injecting a huge error body, and
@@ -788,6 +788,123 @@ def test_sanitize_agent_error_stderr_combined_with_existing_tests():
    assert "workspace logs" in out


+# ─── reason passthrough (internal#211/#212: surface actionable provider error) ───
+
+
+def test_sanitize_agent_error_reason_surfaced_verbatim():
+    """A curated provider reason is shown to the user, not collapsed to the
+    exception class name. This is the internal#211 regression: a 403
+    org-disabled message must reach the canvas."""
+    reason = (
+        "provider HTTP 403 — oauth_org_not_allowed — Your organization has "
+        "disabled Claude subscription access for Claude Code · Use an "
+        "Anthropic API key instead, or ask your admin to enable access"
+    )
+
+    class _ResultErr(Exception):
+        pass
+
+    out = sanitize_agent_error(exc=_ResultErr("opaque"), reason=reason)
+    # The actionable provider guidance and status code must be visible.
+    assert "403" in out
+    assert "oauth_org_not_allowed" in out
+    assert "disabled Claude subscription access" in out
+    assert "ask your admin to enable access" in out
+    # NOT the old opaque form.
+    assert "see workspace logs" not in out
+
+
+def test_sanitize_agent_error_reason_still_scrubs_secrets():
+    """Even on the reason path the key/token scrubber runs — a buggy caller
+    that lets a bearer token into the reason still gets it redacted."""
+    leaky = (
+        "provider HTTP 401 — auth failed — Authorization: Bearer "
+        "PLACEHOLDER_LONG_TOKEN_0123456789abcdefghijklm please re-auth"
+    )
+    out = sanitize_agent_error(reason=leaky)
+    assert "[REDACTED]" in out
+    assert "PLACEHOLDER_LONG_TOKEN_0123456789abcdefghijklm" not in out
+    # The non-secret guidance still survives the scrub.
+    assert "401" in out
+    assert "please re-auth" in out
+
+
+def test_sanitize_agent_error_reason_scrubs_all_secret_formats():
+    """The scrubber must redact every realistic credential shape — not just
+    the `Bearer <tok>` form the original test happened to exercise
+    (internal#212 review finding: bare `sk-ant-api03-…` keys, JSON-quoted
+    "token"/"apiKey" values, and `aws_secret_access_key=` all leaked).
+    All curated/actionable guidance must still survive the scrub.
+    """
+    # 1. Bare `sk-…` key (stand-in for sk-ant-api03) — no `[ :=]` separator
+    #    after the prefix (a real key uses `-`), so the legacy regex missed it.
+    bare = (
+        "provider HTTP 401 — auth failed — invalid key "
+        "sk-FAKEPLACEHOLDERabcdefghijklmnopqrstuvwxy0123456789 "
+        "please re-auth"
+    )
+    out = sanitize_agent_error(reason=bare)
+    assert "sk-FAKEPLACEHOLDERabcdefghijklmnopqrstuvwxy0123456789" not in out
+    assert "[REDACTED]" in out
+    assert "401" in out  # actionable status survives
+    assert "please re-auth" in out  # actionable guidance survives
+
+    # 2. JSON-quoted "token" / "apiKey" values.
+    jblob = (
+        'provider error — config dump {"token": '
+        '"abcDEF0123456789ghIJKL0123456789mnopQRST", "apiKey": '
+        '"anon_fakefakefakefakefakefakefakefakefakefake"} — '
+        "use an API key instead"
+    )
+    out = sanitize_agent_error(reason=jblob)
+    assert "abcDEF0123456789ghIJKL0123456789mnopQRST" not in out
+    assert "anon_fakefakefakefakefakefakefakefakefakefake" not in out
+    assert "[REDACTED]" in out
+    assert "use an API key instead" in out  # actionable guidance survives
+
+    # 3. aws_secret_access_key=… form.
+    awsblob = (
+        "provider HTTP 403 — boto credential error "
+        "aws_secret_access_key=wJalrXUtnFEMI/K7MDENG/bPxRfiCYEXAMPLEKEY — "
+        "ask your admin to enable access"
+    )
+    out = sanitize_agent_error(reason=awsblob)
+    assert "wJalrXUtnFEMI/K7MDENG/bPxRfiCYEXAMPLEKEY" not in out
+    assert "[REDACTED]" in out
+    assert "403" in out  # actionable status survives
+    assert "ask your admin to enable access" in out  # guidance survives
+
+    # 4. Regression: the original Bearer form still redacts.
+    # Uses PLACEHOLDER_LONG_TOKEN (>=40 chars, no sk-ant- prefix) to avoid
+    # triggering the secret-scan workflow pattern
+    # `sk-ant-[A-Za-z0-9_-]{40,}`.
+    bearer = (
+        "provider HTTP 401 — Authorization: Bearer "
+        "PLACEHOLDER_LONG_TOKEN_9876543210abcdefghij re-auth"
+    )
+    out = sanitize_agent_error(reason=bearer)
+    assert "PLACEHOLDER_LONG_TOKEN_9876543210abcdefghij" not in out
+    assert "[REDACTED]" in out
+    assert "re-auth" in out
+
+
+def test_sanitize_agent_error_reason_wins_over_stderr():
+    """When both reason and stderr are passed, the curated reason wins."""
+    out = sanitize_agent_error(
+        reason="provider HTTP 403 — use an API key",
+        stderr="raw subprocess noise that should not be shown",
+    )
+    assert "use an API key" in out
+    assert "raw subprocess noise" not in out
+
+
+def test_sanitize_agent_error_no_reason_unchanged():
+    """Omitting reason preserves the original generic behavior."""
+    out = sanitize_agent_error(exc=ValueError("boom"))
+    assert "ValueError" in out
+    assert "workspace logs" in out
+
+

 # ======================================================================
 # classify_subprocess_error
Author	SHA1	Message	Date
fullstack-engineer	878e08c7fc	trigger: re-fire CI all-required sentinel (Gitea 1.22.6 skipped-sentinel rerun; no code change) sop-tier-check / tier-check (pull_request) Waiting to run Details Block internal-flavored paths / Block forbidden paths (pull_request) Successful in 3s Details CI / Detect changes (pull_request) Successful in 6s Details CI / Platform (Go) (pull_request) Successful in 6m24s Details E2E API Smoke Test / detect-changes (pull_request) Successful in 7s Details E2E Chat / detect-changes (pull_request) Successful in 7s Details Handlers Postgres Integration / detect-changes (pull_request) Successful in 7s Details Harness Replays / detect-changes (pull_request) Successful in 5s Details lint-required-no-paths / lint-required-no-paths (pull_request) Successful in 56s Details CI / Canvas (Next.js) (pull_request) Successful in 7m57s Details publish-runtime-autobump / bump-and-tag (pull_request) Has been skipped Details Runtime PR-Built Compatibility / detect-changes (pull_request) Successful in 6s Details publish-runtime-autobump / pr-validate (pull_request) Successful in 27s Details Secret scan / Scan diff for credential-shaped strings (pull_request) Successful in 5s Details Ops Scripts Tests / Ops scripts (unittest) (pull_request) Successful in 57s Details gate-check-v3 / gate-check (pull_request) Successful in 4s Details qa-review / approved (pull_request) Successful in 4s Details security-review / approved (pull_request) Successful in 3s Details sop-checklist / all-items-acked (pull_request) [info tier:low] acked: 0/7 — missing: comprehensive-testing, local-postgres-e2e, staging-smoke, +4 — body-unfilled: comprehensive-testing, l Details sop-checklist / na-declarations (pull_request) N/A: (none) Details CI / Shellcheck (E2E scripts) (pull_request) Successful in 14s Details E2E Chat / E2E Chat (pull_request) Failing after 1s Details E2E API Smoke Test / E2E API Smoke Test (pull_request) Successful in 1m2s Details Harness Replays / Harness Replays 
(pull_request) Successful in 4s Details CI / Canvas Deploy Reminder (pull_request) Has been skipped Details Handlers Postgres Integration / Handlers Postgres Integration (pull_request) Successful in 2m25s Details Runtime PR-Built Compatibility / PR-built wheel + import smoke (pull_request) Successful in 2m16s Details CI / Python Lint & Test (pull_request) Successful in 6m42s Details CI / all-required (pull_request) Successful in 1s Details audit-force-merge / audit (pull_request) Successful in 8s Details The CI / all-required sentinel job was never scheduled in the prior ci.yml run (documented Gitea-1.22/act_runner skipped-sentinel quirk), so it never posted its terminal status and the required context stayed pending. Empty-tree commit is the sanctioned 1.22.6 rerun mechanism — it makes the real sentinel job actually schedule and post its genuine status. No source change.	2026-05-17 17:13:26 +00:00
infra-runtime-be	50dea87a9d	Merge pull request 'fix(tests)+build: complete secret-scan fixture cleanup for #1420 ' (#1431 ) from runtime/fix-api03-test-fixture into fix/issue212-actionable-agent-error-reason Block internal-flavored paths / Block forbidden paths (pull_request) Successful in 4s Details CI / Detect changes (pull_request) Successful in 5s Details E2E API Smoke Test / detect-changes (pull_request) Successful in 6s Details E2E Chat / detect-changes (pull_request) Successful in 7s Details Handlers Postgres Integration / detect-changes (pull_request) Successful in 9s Details Harness Replays / detect-changes (pull_request) Successful in 4s Details CI / Platform (Go) (pull_request) Successful in 6m5s Details publish-runtime-autobump / pr-validate (pull_request) Successful in 25s Details publish-runtime-autobump / bump-and-tag (pull_request) Has been skipped Details lint-required-no-paths / lint-required-no-paths (pull_request) Successful in 55s Details Secret scan / Scan diff for credential-shaped strings (pull_request) Successful in 5s Details Runtime PR-Built Compatibility / detect-changes (pull_request) Successful in 6s Details gate-check-v3 / gate-check (pull_request) Successful in 4s Details qa-review / approved (pull_request) Successful in 5s Details security-review / approved (pull_request) Successful in 6s Details sop-checklist / na-declarations (pull_request) N/A: (none) Details sop-checklist / all-items-acked (pull_request) Successful in 5s Details sop-tier-check / tier-check (pull_request) Successful in 5s Details Ops Scripts Tests / Ops scripts (unittest) (pull_request) Successful in 1m0s Details CI / Canvas (Next.js) (pull_request) Successful in 7m38s Details CI / Shellcheck (E2E scripts) (pull_request) Successful in 10s Details E2E Chat / E2E Chat (pull_request) Failing after 2s Details E2E API Smoke Test / E2E API Smoke Test (pull_request) Successful in 49s Details Harness Replays / Harness Replays (pull_request) Successful in 3s Details 
Handlers Postgres Integration / Handlers Postgres Integration (pull_request) Successful in 1m37s Details Runtime PR-Built Compatibility / PR-built wheel + import smoke (pull_request) Successful in 2m11s Details CI / Python Lint & Test (pull_request) Successful in 6m28s Details CI / Canvas Deploy Reminder (pull_request) Has been skipped Details CI / all-required (pull_request) Successful in 1s Details	2026-05-17 16:42:01 +00:00
infra-runtime-be	335796b0b4	fix(tests): replace remaining sk-ant-api03- fixtures with non-matching tokens Block internal-flavored paths / Block forbidden paths (pull_request) Successful in 3s Details publish-runtime-autobump / pr-validate (pull_request) Successful in 28s Details publish-runtime-autobump / bump-and-tag (pull_request) Has been skipped Details Secret scan / Scan diff for credential-shaped strings (pull_request) Successful in 2s Details gate-check-v3 / gate-check (pull_request) Successful in 3s Details qa-review / approved (pull_request) Successful in 3s Details security-review / approved (pull_request) Successful in 4s Details sop-checklist / na-declarations (pull_request) N/A: (none) Details sop-checklist / all-items-acked (pull_request) Successful in 4s Details sop-tier-check / tier-check (pull_request) Successful in 5s Details lint-required-no-paths / lint-required-no-paths (pull_request) Successful in 1m3s Details audit-force-merge / audit (pull_request) Successful in 4s Details The secret-scan workflow flags sk-ant-[A-Za-z0-9_-]{40,} patterns. Two sk-ant-api03-* fixture tokens (47 and 62 chars) were present in test_sanitize_agent_error_reason_scrubs_all_secret_formats. They were not replaced by PR #1430 (which only fixed the sk-ant-DEADBEEF* tokens). Replace with tokens that still exercise the same scrubber paths: - BARE sk-* case (≥24 chars after "sk-"): use sk-FAKEPLACEHOLDER... (53 chars total; starts with "sk-" so the bare-pattern scrubber catches it, but lacks "sk-ant-" so the secret-scan pattern does not fire). - JSON-quoted apiKey value (≥24 chars): use anon_fakefakefake... (45 chars; satisfies the JSON-quoted redaction path; does not match any secret-scan credential pattern). Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>	2026-05-17 16:34:31 +00:00
infra-runtime-be	699b5fb275	Merge pull request 'fix(tests)+build: unblock secret scan and Runtime PR-Built on #1420 ' (#1430 ) from runtime/fix-test-fixture-v3 into fix/issue212-actionable-agent-error-reason Block internal-flavored paths / Block forbidden paths (pull_request) Successful in 3s Details CI / Detect changes (pull_request) Successful in 5s Details E2E API Smoke Test / detect-changes (pull_request) Successful in 6s Details E2E Chat / detect-changes (pull_request) Successful in 5s Details Harness Replays / detect-changes (pull_request) Successful in 3s Details Handlers Postgres Integration / detect-changes (pull_request) Successful in 5s Details publish-runtime-autobump / bump-and-tag (pull_request) Has been skipped Details Secret scan / Scan diff for credential-shaped strings (pull_request) Failing after 9s Details Runtime PR-Built Compatibility / detect-changes (pull_request) Successful in 12s Details publish-runtime-autobump / pr-validate (pull_request) Successful in 30s Details gate-check-v3 / gate-check (pull_request) Successful in 8s Details qa-review / approved (pull_request) Successful in 7s Details security-review / approved (pull_request) Successful in 5s Details sop-checklist / na-declarations (pull_request) N/A: (none) Details sop-checklist / all-items-acked (pull_request) Successful in 5s Details sop-tier-check / tier-check (pull_request) Successful in 6s Details lint-required-no-paths / lint-required-no-paths (pull_request) Successful in 1m0s Details CI / Shellcheck (E2E scripts) (pull_request) Successful in 12s Details Ops Scripts Tests / Ops scripts (unittest) (pull_request) Successful in 1m6s Details E2E Chat / E2E Chat (pull_request) Failing after 1s Details Harness Replays / Harness Replays (pull_request) Successful in 5s Details E2E API Smoke Test / E2E API Smoke Test (pull_request) Successful in 2m44s Details Handlers Postgres Integration / Handlers Postgres Integration (pull_request) Successful in 2m52s Details Runtime PR-Built 
Compatibility / PR-built wheel + import smoke (pull_request) Successful in 2m32s Details CI / Platform (Go) (pull_request) Successful in 6m41s Details CI / Canvas (Next.js) (pull_request) Successful in 7m19s Details CI / Canvas Deploy Reminder (pull_request) Has been skipped Details CI / Python Lint & Test (pull_request) Successful in 6m37s Details CI / all-required (pull_request) Successful in 0s Details	2026-05-17 16:18:01 +00:00
infra-runtime-be	fb2fd20c9e	fix(tests)+build: unblock secret scan and Runtime PR-Built on #1420 Block internal-flavored paths / Block forbidden paths (pull_request) Successful in 3s Details publish-runtime-autobump / bump-and-tag (pull_request) Has been skipped Details Secret scan / Scan diff for credential-shaped strings (pull_request) Successful in 3s Details gate-check-v3 / gate-check (pull_request) Successful in 3s Details qa-review / approved (pull_request) Successful in 4s Details security-review / approved (pull_request) Successful in 3s Details sop-tier-check / tier-check (pull_request) Successful in 3s Details publish-runtime-autobump / pr-validate (pull_request) Successful in 24s Details lint-required-no-paths / lint-required-no-paths (pull_request) Successful in 56s Details sop-checklist / all-items-acked (pull_request) acked: 0/7 — missing: comprehensive-testing, local-postgres-e2e, staging-smoke, +4 Details sop-checklist / na-declarations (pull_request) N/A: (none) Details audit-force-merge / audit (pull_request) Successful in 3s Details Two CI failures blocking PR #1420: 1. Secret scan: `workspace/tests/test_executor_helpers.py` contains two `sk-ant-DEADBEEF...` fixtures matching `sk-ant-[A-Za-z0-9_-]{40,}`. Replaced both with PLACEHOLDER_LONG_TOKEN_... (≥40 chars, no sk-ant- prefix — scrubber path still exercised). 2. Runtime PR-Built: `workspace/a2a_tools_identity.py` missing from TOP_LEVEL_MODULES in scripts/build_runtime_package.py, causing build failure with "TOP_LEVEL_MODULES drifted". Added it. Both fixes verified locally: - pytest affected tests: 3/3 PASSED - build_runtime_package.py: builds cleanly Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>	2026-05-17 15:48:31 +00:00
fullstack-engineer	7d2eaa3748	harden(runtime): scrub bare sk-ant keys, JSON-quoted token/apiKey, aws_secret_access_key in _sanitize_for_external Block internal-flavored paths / Block forbidden paths (pull_request) Successful in 11s Details CI / Detect changes (pull_request) Successful in 12s Details E2E API Smoke Test / detect-changes (pull_request) Successful in 11s Details E2E Chat / detect-changes (pull_request) Successful in 12s Details Handlers Postgres Integration / detect-changes (pull_request) Successful in 12s Details Harness Replays / detect-changes (pull_request) Successful in 7s Details publish-runtime-autobump / pr-validate (pull_request) Successful in 35s Details publish-runtime-autobump / bump-and-tag (pull_request) Has been skipped Details lint-required-no-paths / lint-required-no-paths (pull_request) Successful in 1m5s Details Runtime PR-Built Compatibility / detect-changes (pull_request) Successful in 10s Details Secret scan / Scan diff for credential-shaped strings (pull_request) Failing after 9s Details gate-check-v3 / gate-check (pull_request) Successful in 7s Details security-review / approved (pull_request) Successful in 9s Details qa-review / approved (pull_request) Successful in 10s Details sop-checklist / na-declarations (pull_request) N/A: (none) Details sop-checklist / all-items-acked (pull_request) Successful in 7s Details sop-tier-check / tier-check (pull_request) Successful in 9s Details CI / Platform (Go) (pull_request) Successful in 10m22s Details CI / Canvas (Next.js) (pull_request) Successful in 10m48s Details CI / Shellcheck (E2E scripts) (pull_request) Successful in 3s Details E2E Chat / E2E Chat (pull_request) Failing after 3s Details Harness Replays / Harness Replays (pull_request) Successful in 1s Details E2E API Smoke Test / E2E API Smoke Test (pull_request) Successful in 54s Details Runtime PR-Built Compatibility / PR-built wheel + import smoke (pull_request) Failing after 43s Details Handlers Postgres Integration / 
Handlers Postgres Integration (pull_request) Successful in 1m56s Details CI / Python Lint & Test (pull_request) Successful in 6m40s Details CI / Canvas Deploy Reminder (pull_request) Has been skipped Details CI / all-required (pull_request) Successful in 1s Details Addresses internal#212 PR#1420 dual-review SECURITY finding (infra-sre / infra-runtime-be): _sanitize_for_external missed three real credential shapes because the legacy regex requires a `[ :=]+` separator after the prefix: - bare `sk-ant-api03-…` keys (real key uses `-`, not `[ :=]`) - JSON-quoted "token"/"apiKey"/"secret"/"password" values - `aws_secret_access_key=…` Added three narrowly-scoped regexes (length thresholds tuned so curated short examples like `sk-ant-EXAMPLE-SHORT` / `ghp_SHORT_TOKEN` and all actionable auth/quota/HTTP guidance still pass through). Extended the unit test with test_sanitize_agent_error_reason_scrubs_all_secret_formats asserting redaction for all three new formats plus the original Bearer regression. Full sanitize suite green; existing passthrough assertions unchanged. Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>	2026-05-17 07:56:16 -07:00
fullstack-engineer	44b78e28c8	fix(runtime+canvas): surface actionable provider error reason instead of opaque "Agent error (Exception)" CI / all-required (pull_request) Blocked by required conditions Details Block internal-flavored paths / Block forbidden paths (pull_request) Successful in 4s Details CI / Detect changes (pull_request) Successful in 9s Details E2E API Smoke Test / detect-changes (pull_request) Successful in 12s Details E2E Chat / detect-changes (pull_request) Successful in 10s Details Harness Replays / detect-changes (pull_request) Successful in 7s Details Handlers Postgres Integration / detect-changes (pull_request) Successful in 10s Details publish-runtime-autobump / bump-and-tag (pull_request) Has been skipped Details Runtime PR-Built Compatibility / detect-changes (pull_request) Successful in 11s Details Secret scan / Scan diff for credential-shaped strings (pull_request) Failing after 6s Details gate-check-v3 / gate-check (pull_request) Successful in 6s Details qa-review / approved (pull_request) Successful in 6s Details security-review / approved (pull_request) Successful in 6s Details sop-checklist / na-declarations (pull_request) N/A: (none) Details publish-runtime-autobump / pr-validate (pull_request) Successful in 33s Details sop-checklist / all-items-acked (pull_request) Successful in 6s Details sop-tier-check / tier-check (pull_request) Successful in 6s Details CI / Shellcheck (E2E scripts) (pull_request) Successful in 2s Details lint-required-no-paths / lint-required-no-paths (pull_request) Successful in 1m9s Details E2E Chat / E2E Chat (pull_request) Failing after 13s Details Harness Replays / Harness Replays (pull_request) Successful in 2s Details Runtime PR-Built Compatibility / PR-built wheel + import smoke (pull_request) Failing after 55s Details E2E API Smoke Test / E2E API Smoke Test (pull_request) Successful in 2m38s Details Handlers Postgres Integration / Handlers Postgres Integration (pull_request) Successful in 2m38s Details 
CI / Platform (Go) (pull_request) Successful in 7m2s Details CI / Python Lint & Test (pull_request) Successful in 6m39s Details CI / Canvas (Next.js) (pull_request) Successful in 7m56s Details CI / Canvas Deploy Reminder (pull_request) Has been skipped Details internal#212 (P0 from internal#211). When the embedded `claude` CLI emits a terminal result message with is_error=true (e.g. 403 oauth_org_not_allowed "Your organization has disabled Claude subscription access · Use an Anthropic API key instead, or ask your admin to enable access"), the user saw only `Agent error (Exception) — see workspace logs for details.` — a dead end (no such logs UI) that discards the exact secret-safe, actionable text the user needs. Root cause was a multi-cut loss of the CLI's result/error/api_error_status: cut #2 sanitize_agent_error reduced every failure to type(exc).__name__. → add a `reason` passthrough: a pre-curated, user-actionable, secret-safe explanation is surfaced verbatim (still scrubbed for key/token/bearer as a second pass). reason wins over stderr; omitting it preserves the prior generic behavior exactly. cut #3a workspace-server dropped error_detail from the live ACTIVITY_LOGGED websocket broadcast (it was persisted to the DB column but never sent), so the canvas had nothing to render. → include error_detail in the broadcast payload (already capped at 4096 by the runtime's report_activity helper). cut #3b canvas useChatSocket hardcoded the opaque string, ignoring even the activity summary. → render error_detail (fallback: summary, then a generic retry hint). The dead "see workspace logs for details." phrase that pointed at nonexistent UI is removed (a full logs tab is a separate larger follow-up, not this PR — reason-first per CTO). 
The runtime-side cut #1 (template-claude-code claude_sdk_executor._run_query ignoring is_error and the SDK collapsing errors[] to the bare subtype "success") is fixed in a stacked PR on molecule-ai-workspace-template-claude-code (depends on this PR's sanitize_agent_error `reason` kwarg, which ships via the molecule-ai-workspace-runtime package). Tests: 4 new sanitize_agent_error reason tests (verbatim surfacing, secret scrub still applied, reason>stderr precedence, no-reason unchanged). Verified fail-before / pass-after; full sanitize suite green; no new regressions (the 2 pre-existing test_get_a2a_instructions_mcp failures are unrelated). Refs: internal#211, internal#212 Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>	2026-05-17 07:20:14 -07:00