2026-05-25 04:54:05 -04:00
2 changed files with 165 additions and 24 deletions
@@ -22,6 +22,10 @@ from datetime import datetime, timezone
 from pathlib import Path
 from .. import supervise as _supervise
 from ..backend.docker.cred_proxy_apply import (
    CredProxyApplyError,
    apply_routes_change,
 )
 from ..log import info
 from ..supervise import (
    ACTION_OPERATOR_EDIT,
@@ -33,6 +37,7 @@ from ..supervise import (
    STATUS_MODIFIED,
    STATUS_REJECTED,
    TOOL_CAPABILITY_BLOCK,
    TOOL_CRED_PROXY_BLOCK,
    list_pending_proposals,
    render_diff,
    write_audit_entry,
@@ -78,9 +83,28 @@ def approve(
    notes: str = "",
    final_file: str | None = None,
 ) -> None:
-    """Write an approval response and an audit entry. If `final_file`
+    """Apply the proposal to the running sidecar, write the response
-    is provided the status is `modified`; otherwise `approved`."""
+    file the agent's tool call is waiting on, and append an audit
    entry. If `final_file` is provided the status is `modified`;
    otherwise `approved`.
    Raises CredProxyApplyError if the cred-proxy-block apply fails
    (sidecar down, invalid JSON survived the operator's modify).
    On failure no response is written and no audit entry is
    appended — the proposal stays pending so the operator can fix
    the input and retry."""
    status = STATUS_MODIFIED if final_file is not None else STATUS_APPROVED
    file_to_apply = final_file if final_file is not None else qp.proposal.proposed_file
    diff_before, diff_after = "", ""
    if qp.proposal.tool == TOOL_CRED_PROXY_BLOCK:
        diff_before, diff_after = apply_routes_change(
            qp.proposal.bottle_slug, file_to_apply,
        )
    # pipelock-block + capability-block remediation lands in PRDs
    # 0015 + 0016; for 0014 they remain no-op approvals and the
    # audit diff stays empty.
    response = Response(
        proposal_id=qp.proposal.id,
        status=status,
@@ -88,11 +112,16 @@ def approve(
        final_file=final_file,
    )
    write_response(qp.queue_dir, response)
-    _write_audit(qp, action=status, notes=notes, final_file=final_file)
+    _write_audit(
        qp, action=status, notes=notes,
        diff_before=diff_before, diff_after=diff_after,
    )
 def reject(qp: QueuedProposal, *, reason: str) -> None:
-    """Write a rejection response and an audit entry."""
+    """Write a rejection response and an audit entry. No remediation
    apply happens on reject — the agent sees the rejection and
    decides whether to retry / give up."""
    response = Response(
        proposal_id=qp.proposal.id,
        status=STATUS_REJECTED,
@@ -100,7 +129,7 @@ def reject(qp: QueuedProposal, *, reason: str) -> None:
        final_file=None,
    )
    write_response(qp.queue_dir, response)
-    _write_audit(qp, action=STATUS_REJECTED, notes=reason, final_file=None)
+    _write_audit(qp, action=STATUS_REJECTED, notes=reason, diff_before="", diff_after="")
 def _write_audit(
@@ -108,19 +137,21 @@ def _write_audit(
    *,
    action: str,
    notes: str,
-    final_file: str | None,
+    diff_before: str,
    diff_after: str,
 ) -> None:
    """Audit log for cred-proxy / pipelock tools. capability-block has
    no audit log (its changes are captured by the bottle's rebuild
-    record + git history per PRD 0016)."""
+    record + git history per PRD 0016).
    For cred-proxy-block approvals the (before, after) come from the
    apply_routes_change return — a real fetched-from-sidecar diff.
    For rejections, or for tools whose remediation hasn't landed yet
    (pipelock in 0014, capability anywhere), both are empty strings
    and the audit diff renders as empty."""
    component = COMPONENT_FOR_TOOL.get(qp.proposal.tool)
    if component is None:
        # capability-block: skip audit log; 0016 records via rebuild.
        return
    # v1 audit diff is empty: 0013's no-op handler doesn't have the
    # actual current-on-disk file to diff against, only the agent's
    # proposed file. 0014 / 0015 fill in the real diff against the
    # live routes.json / allowlist after writing the change.
    write_audit_entry(AuditEntry(
        timestamp=datetime.now(timezone.utc).isoformat(),
        bottle_slug=qp.proposal.bottle_slug,
@@ -128,11 +159,7 @@ def _write_audit(
        operator_action=action,
        operator_notes=notes,
        justification=qp.proposal.justification,
-        diff=render_diff(
+        diff=render_diff(diff_before, diff_after, label=component),
            "",
            final_file if final_file is not None else qp.proposal.proposed_file,
            label=component,
        ),
    ))
@@ -228,15 +255,21 @@ def _main_loop(stdscr: "curses._CursesWindow") -> None:
        elif key in (curses.KEY_ENTER, 10, 13, ord("v")):
            _detail_view(stdscr, qp)
        elif key == ord("a"):
            try:
                approve(qp)
                status_line = f"approved {qp.proposal.tool} for [{qp.proposal.bottle_slug}]"
            except CredProxyApplyError as e:
                status_line = f"apply failed: {e}"
        elif key == ord("m"):
            edited = _modify(stdscr, qp)
            if edited is None:
                status_line = "modify aborted (no change)"
            else:
                try:
                    approve(qp, final_file=edited, notes="operator modified before approving")
                    status_line = f"modified+approved {qp.proposal.tool} for [{qp.proposal.bottle_slug}]"
                except CredProxyApplyError as e:
                    status_line = f"apply failed: {e}"
        elif key == ord("r"):
            reason = _prompt(stdscr, "reject reason: ")
            if reason:
@@ -316,12 +349,18 @@ def _detail_view(stdscr: "curses._CursesWindow", qp: QueuedProposal) -> None:
        elif key == ord("G"):
            offset = max(0, len(lines) - 1)
        elif key == ord("a"):
            try:
                approve(qp)
            except CredProxyApplyError:
                pass  # Status surfaces back in the list view's render.
            return
        elif key == ord("m"):
            edited = _modify(stdscr, qp)
            if edited is not None:
                try:
                    approve(qp, final_file=edited, notes="operator modified before approving")
                except CredProxyApplyError:
                    pass
            return
        elif key == ord("r"):
            reason = _prompt(stdscr, "reject reason: ")
@@ -1,8 +1,12 @@
-"""Unit: dashboard headless paths (PRD 0013 phase 4).
+"""Unit: dashboard headless paths (PRD 0013 phase 4, PRD 0014).
 The curses TUI itself isn't exercised here — these tests cover the
 discovery + approve/reject + audit-write paths that the TUI's key
 handlers call into.
 apply_routes_change is stubbed at the dashboard module level so the
 tests don't need a running cred-proxy sidecar; the real docker
 exec/cp/SIGHUP plumbing is covered by the integration test.
 """
 import os
@@ -12,6 +16,7 @@ from datetime import datetime, timezone
 from pathlib import Path
 from claude_bottle import supervise
 from claude_bottle.backend.docker.cred_proxy_apply import CredProxyApplyError
 from claude_bottle.cli import dashboard
 from claude_bottle.supervise import (
    Proposal,
@@ -110,8 +115,15 @@ class TestDiscoverPending(_FakeHomeMixin, unittest.TestCase):
 class TestApproveReject(_FakeHomeMixin, unittest.TestCase):
    def setUp(self):
        self._setup_fake_home()
        self._original_apply = dashboard.apply_routes_change
        # Default stub: succeed with deterministic before/after so the
        # audit log shows a non-empty diff.
        dashboard.apply_routes_change = lambda slug, content: (
            '{"routes": []}\n', content,
        )
    def tearDown(self):
        dashboard.apply_routes_change = self._original_apply
        self._teardown_fake_home()
    def _enqueue(self, tool: str = TOOL_CRED_PROXY_BLOCK):
@@ -166,6 +178,96 @@ class TestApproveReject(_FakeHomeMixin, unittest.TestCase):
        self.assertEqual(0, len(read_audit_entries("cred-proxy", "dev")))
 class TestCredProxyApplyWiring(_FakeHomeMixin, unittest.TestCase):
    """PRD 0014 Phase 3: approve() on a cred-proxy-block proposal
    must call apply_routes_change with the right args and surface
    its failures."""
    def setUp(self):
        self._setup_fake_home()
        self._original_apply = dashboard.apply_routes_change
    def tearDown(self):
        dashboard.apply_routes_change = self._original_apply
        self._teardown_fake_home()
    def _enqueue_cred_proxy(self, proposed: str = '{"routes": []}\n'):
        p = Proposal.new(
            bottle_slug="dev", tool=TOOL_CRED_PROXY_BLOCK,
            proposed_file=proposed,
            justification="need a route",
            current_file_hash=sha256_hex(proposed),
            now=FIXED,
        )
        qdir = supervise.queue_dir_for_slug("dev")
        qdir.mkdir(parents=True, exist_ok=True)
        supervise.write_proposal(qdir, p)
        return dashboard.QueuedProposal(proposal=p, queue_dir=qdir)
    def test_cred_proxy_block_calls_apply_with_proposed_file(self):
        calls = []
        dashboard.apply_routes_change = lambda slug, content: (
            calls.append((slug, content)) or ("before", content)
        )
        qp = self._enqueue_cred_proxy(proposed='{"routes": [{"path": "/new/"}]}\n')
        dashboard.approve(qp)
        self.assertEqual(1, len(calls))
        slug, content = calls[0]
        self.assertEqual("dev", slug)
        self.assertEqual('{"routes": [{"path": "/new/"}]}\n', content)
    def test_modify_passes_final_file_to_apply(self):
        calls = []
        dashboard.apply_routes_change = lambda slug, content: (
            calls.append(content) or ("before", content)
        )
        qp = self._enqueue_cred_proxy()
        dashboard.approve(qp, final_file='{"routes": [{"path": "/edited/"}]}\n', notes="tweaked")
        self.assertEqual(['{"routes": [{"path": "/edited/"}]}\n'], calls)
    def test_apply_failure_blocks_response_and_audit(self):
        dashboard.apply_routes_change = lambda slug, content: (_ for _ in ()).throw(
            CredProxyApplyError("docker exec failed")
        )
        qp = self._enqueue_cred_proxy()
        with self.assertRaises(CredProxyApplyError):
            dashboard.approve(qp)
        # No response file (proposal stays pending).
        self.assertEqual(
            [qp.proposal.id],
            [p.id for p in supervise.list_pending_proposals(qp.queue_dir)],
        )
        # No audit entry.
        self.assertEqual([], read_audit_entries("cred-proxy", "dev"))
    def test_real_diff_lands_in_audit(self):
        dashboard.apply_routes_change = lambda slug, content: (
            '{"routes": []}\n',  # before
            '{"routes": [{"path": "/new/"}]}\n',  # after
        )
        qp = self._enqueue_cred_proxy(proposed='{"routes": [{"path": "/new/"}]}\n')
        dashboard.approve(qp)
        entries = read_audit_entries("cred-proxy", "dev")
        self.assertEqual(1, len(entries))
        self.assertIn('+{"routes": [{"path": "/new/"}]}', entries[0].diff)
        self.assertIn('-{"routes": []}', entries[0].diff)
    def test_reject_does_not_call_apply(self):
        called = []
        dashboard.apply_routes_change = lambda slug, content: (
            called.append(True) or ("", content)
        )
        qp = self._enqueue_cred_proxy()
        dashboard.reject(qp, reason="no thanks")
        self.assertEqual([], called)
        # Reject still writes a response + audit entry with empty diff.
        resp = read_response(qp.queue_dir, qp.proposal.id)
        self.assertEqual(STATUS_REJECTED, resp.status)
        entries = read_audit_entries("cred-proxy", "dev")
        self.assertEqual(1, len(entries))
        self.assertEqual("", entries[0].diff)
 class TestEditInEditor(unittest.TestCase):
    def test_runs_editor_returns_edited_content(self):
        # Fake "editor" is /bin/sh -c 'cat <<EOF > $1 ... EOF'