fix(22): revise plans based on checker feedback

2026-04-01 17:59:51 +00:00 · 2026-04-01 17:59:51 +00:00 · ded9afbaed
commit ded9afbaed
parent 9d1a91b4bc
4 changed files with 325 additions and 80 deletions
--- a/.planning/phases/22-agent-streaming/22-00-PLAN.md
+++ b/.planning/phases/22-agent-streaming/22-00-PLAN.md
@ -30,6 +30,7 @@ must_haves:
    - "@tanstack/react-virtual is installed in ui workspace"
    - "Cursor blink animation is declared in index.css"
    - "All Wave 0 test stubs exist and run without error"
+    - "All 11 agent roles have visually distinct color assignments (no two roles share the same color)"
  artifacts:
    - path: "ui/src/lib/agent-role-colors.ts"
      provides: "AgentRole to Tailwind class map"
@ -132,14 +133,14 @@ export interface ChatMessage {
   ```
   updatedAt: timestamp("updated_at", { withTimezone: true }).defaultNow(),
   ```
-   Note: NOT `.notNull()` — existing rows will have null until updated.
+   Note: NOT `.notNull()` -- existing rows will have null until updated.

 2. Create migration `packages/db/src/migrations/0048_add_chat_messages_updated_at.sql`:
   ```sql
   ALTER TABLE "chat_messages" ADD COLUMN "updated_at" timestamp with time zone DEFAULT now();
   ```

-3. Update `packages/shared/src/types/chat.ts` — add `updatedAt` to `ChatMessage` interface:
+3. Update `packages/shared/src/types/chat.ts` -- add `updatedAt` to `ChatMessage` interface:
   ```
   updatedAt: string | null;
   ```
@ -149,27 +150,31 @@ export interface ChatMessage {
   pnpm add @tanstack/react-virtual --filter @paperclipai/ui
   ```

-5. Create `ui/src/lib/agent-role-colors.ts`:
+5. Create `ui/src/lib/agent-role-colors.ts` with DISTINCT colors for all 11 roles (THEME-03):
   ```typescript
   import type { AgentRole } from "@paperclipai/shared";

   export const agentRoleColors: Record<AgentRole, string> = {
     pm:         "text-blue-600 dark:text-blue-400",
     engineer:   "text-violet-600 dark:text-violet-400",
-     ceo:        "text-yellow-600 dark:text-yellow-400",
-     general:    "text-yellow-600 dark:text-yellow-400",
+     ceo:        "text-amber-600 dark:text-amber-400",
+     general:    "text-slate-600 dark:text-slate-400",
     designer:   "text-pink-600 dark:text-pink-400",
     qa:         "text-orange-600 dark:text-orange-400",
     researcher: "text-teal-600 dark:text-teal-400",
-     devops:     "text-green-600 dark:text-green-400",
-     cto:        "text-green-600 dark:text-green-400",
-     cmo:        "text-neutral-600 dark:text-neutral-400",
-     cfo:        "text-neutral-600 dark:text-neutral-400",
+     devops:     "text-emerald-600 dark:text-emerald-400",
+     cto:        "text-indigo-600 dark:text-indigo-400",
+     cmo:        "text-rose-600 dark:text-rose-400",
+     cfo:        "text-cyan-600 dark:text-cyan-400",
   };

   export const agentRoleColorDefault = "text-muted-foreground";
   ```

+   CRITICAL (THEME-03): Each of the 11 roles MUST have a unique color. The previous plan had ceo+general sharing yellow, devops+cto sharing green, and cmo+cfo sharing neutral. This is corrected above:
+   - pm=blue, engineer=violet, ceo=amber, general=slate, designer=pink
+   - qa=orange, researcher=teal, devops=emerald, cto=indigo, cmo=rose, cfo=cyan
+
 6. Create `ui/src/lib/agent-role-colors.test.ts`:
   ```typescript
   import { describe, it, expect } from "vitest";
@ -193,6 +198,12 @@ export interface ChatMessage {
     it("exports a default fallback color", () => {
       expect(agentRoleColorDefault).toBe("text-muted-foreground");
     });
+
+     it("all 11 roles have distinct color classes", () => {
+       const colors = Object.values(agentRoleColors);
+       const unique = new Set(colors);
+       expect(unique.size).toBe(colors.length);
+     });
   });
   ```

@ -227,14 +238,15 @@ export interface ChatMessage {
    - grep -q "cursor-blink" ui/src/index.css
    - grep -q "@tanstack/react-virtual" ui/package.json
    - grep -q "prefers-reduced-motion" ui/src/index.css
+    - agent-role-colors.test.ts "all 11 roles have distinct color classes" test passes
  </acceptance_criteria>
  <done>
    - chat_messages schema has updatedAt column
    - Migration 0048 exists with ALTER TABLE
    - ChatMessage shared type has updatedAt: string | null
    - @tanstack/react-virtual installed in ui workspace
-    - agent-role-colors.ts exports map for all 11 AgentRole values with light+dark variants
-    - agent-role-colors.test.ts passes (3 tests)
+    - agent-role-colors.ts exports map for all 11 AgentRole values with DISTINCT light+dark variants (no duplicates)
+    - agent-role-colors.test.ts passes (4 tests including uniqueness check)
    - cursor-blink CSS animation in index.css with reduced-motion guard
  </done>
 </task>
@ -382,7 +394,7 @@ Create test stub files using `it.todo()` pattern (established in Phase 21 Wave 0
 - DB migration 0048 adds updated_at to chat_messages
 - ChatMessage type includes updatedAt
 - @tanstack/react-virtual installed
- agent-role-colors.ts covers all 11 roles with themed classes
+- agent-role-colors.ts covers all 11 roles with DISTINCT themed classes (no duplicate colors)
 - Cursor-blink CSS animation declared with reduced-motion guard
 - All 7 Wave 0 test stub files exist and run
 </success_criteria>
--- a/.planning/phases/22-agent-streaming/22-01-PLAN.md
+++ b/.planning/phases/22-agent-streaming/22-01-PLAN.md
@ -132,7 +132,7 @@ export function useChatMessages(conversationId: string | null) {
  <action>
 **1. Add three new methods to `chatService` in `server/src/services/chat.ts`:**

-a) `editMessage(messageId: string, content: string)` — Updates a message's content and updatedAt:
+a) `editMessage(messageId: string, content: string)` -- Updates a message's content and updatedAt:
   ```typescript
   async editMessage(messageId: string, content: string) {
     const [row] = await db
@ -144,7 +144,7 @@ a) `editMessage(messageId: string, content: string)` — Updates a message's con
   },
   ```

-b) `truncateMessagesAfter(conversationId: string, messageId: string)` — Deletes all messages in the conversation created after the given message:
+b) `truncateMessagesAfter(conversationId: string, messageId: string)` -- Deletes all messages in the conversation created after the given message:
   ```typescript
   async truncateMessagesAfter(conversationId: string, messageId: string) {
     // Get the target message's createdAt
@ -165,7 +165,7 @@ b) `truncateMessagesAfter(conversationId: string, messageId: string)` — Delete
   ```
   Import `gt` from `drizzle-orm` alongside existing imports.

-c) `streamEcho(content: string, signal: AbortSignal)` — Async generator that yields fake tokens (stub for Phase 23 real LLM):
+c) `streamEcho(content: string, signal: AbortSignal)` -- Async generator that yields fake tokens (stub for Phase 23 real LLM):
   ```typescript
   async *streamEcho(content: string, signal: AbortSignal) {
     const words = content.split(/\s+/);
@ -179,7 +179,7 @@ c) `streamEcho(content: string, signal: AbortSignal)` — Async generator that y

 **2. Add three new routes to `chatRoutes` in `server/src/routes/chat.ts`:**

-a) `POST /conversations/:id/stream` — SSE streaming endpoint:
+a) `POST /conversations/:id/stream` -- SSE streaming endpoint:
   ```typescript
   router.post("/conversations/:id/stream", async (req, res) => {
     assertBoard(req);
@ -226,7 +226,7 @@ a) `POST /conversations/:id/stream` — SSE streaming endpoint:
   ```
   CRITICAL: `res.flushHeaders()` MUST be called before the for-await loop. Check `res.writable` before every `res.write()` (same guard pattern as `plugins.ts`).

-b) `PATCH /conversations/:id/messages/:msgId` — Edit message content:
+b) `PATCH /conversations/:id/messages/:msgId` -- Edit message content:
   ```typescript
   router.patch("/conversations/:id/messages/:msgId", async (req, res) => {
     assertBoard(req);
@ -244,7 +244,7 @@ b) `PATCH /conversations/:id/messages/:msgId` — Edit message content:
   });
   ```

-c) `DELETE /conversations/:id/messages/after/:msgId` — Truncate messages after a given message:
+c) `DELETE /conversations/:id/messages/after/:msgId` -- Truncate messages after a given message:
   ```typescript
   router.delete("/conversations/:id/messages/after/:msgId", async (req, res) => {
     assertBoard(req);
@ -254,7 +254,16 @@ c) `DELETE /conversations/:id/messages/after/:msgId` — Truncate messages after
   ```
  </action>
  <verify>
-    <automated>cd /opt/nexus && pnpm --filter @paperclipai/server exec -- tsc --noEmit 2>&1 | head -20</automated>
+    <automated>cd /opt/nexus && pnpm --filter @paperclipai/server exec -- tsc --noEmit 2>&1 | head -20 && echo "--- PERF-02 flushHeaders-before-loop check ---" && python3 -c "
+import re
+code = open('server/src/routes/chat.ts').read()
+flush_pos = code.find('flushHeaders')
+loop_pos = code.find('for await')
+assert flush_pos != -1, 'flushHeaders not found'
+assert loop_pos != -1, 'for await not found'
+assert flush_pos < loop_pos, f'PERF-02 FAIL: flushHeaders ({flush_pos}) must precede for-await ({loop_pos})'
+print('PERF-02 OK: flushHeaders precedes for-await loop')
+"</automated>
  </verify>
  <acceptance_criteria>
    - grep -q "text/event-stream" server/src/routes/chat.ts
@ -266,6 +275,7 @@ c) `DELETE /conversations/:id/messages/after/:msgId` — Truncate messages after
    - grep -q "/conversations/:id/stream" server/src/routes/chat.ts
    - grep -q "/conversations/:id/messages/:msgId" server/src/routes/chat.ts
    - grep -q "/conversations/:id/messages/after/:msgId" server/src/routes/chat.ts
+    - flushHeaders() position in file must precede for-await loop position (PERF-02)
  </acceptance_criteria>
  <done>
    - POST /conversations/:id/stream SSE endpoint exists with proper headers flushed before generation
@ -273,12 +283,13 @@ c) `DELETE /conversations/:id/messages/after/:msgId` — Truncate messages after
    - DELETE /conversations/:id/messages/after/:msgId truncates subsequent messages
    - chatService has editMessage, truncateMessagesAfter, and streamEcho methods
    - All routes check res.writable before writing (prevents write-after-end)
+    - PERF-02 verified: flushHeaders precedes the for-await generation loop
    - Server TypeScript compiles without errors in chat files
  </done>
 </task>

 <task type="auto">
-  <name>Task 2: useStreamingChat hook and chat API stream method</name>
+  <name>Task 2: useStreamingChat hook, chat API stream method, and real unit tests</name>
  <read_first>
    - ui/src/hooks/useChatMessages.ts
    - ui/src/api/chat.ts
@ -287,6 +298,7 @@ c) `DELETE /conversations/:id/messages/after/:msgId` — Truncate messages after
  </read_first>
  <files>
    ui/src/hooks/useStreamingChat.ts,
+    ui/src/hooks/useStreamingChat.test.ts,
    ui/src/api/chat.ts
  </files>
  <action>
@ -388,7 +400,7 @@ export function useStreamingChat(conversationId: string | null) {
            // Optimistically insert the completed message into cache to avoid flash (Pitfall 2)
            queryClient.setQueryData(
              ["chat", "messages", conversationId],
-              (old: unknown) => old, // Keep existing data — invalidation will refetch
+              (old: unknown) => old, // Keep existing data -- invalidation will refetch
            );
            queryClient.invalidateQueries({ queryKey: ["chat", "messages", conversationId] });
            queryClient.invalidateQueries({ queryKey: ["chat", "conversations"] });
@ -428,12 +440,179 @@ export function useStreamingChat(conversationId: string | null) {

 Key design decisions:
 - `startTransition` wraps `setStreamingContent` so token appends don't block user input (PERF-02)
- `AbortController` for stop (CHAT-12) — server detects `req.on("close")`
+- `AbortController` for stop (CHAT-12) -- server detects `req.on("close")`
 - On stop, partial content saved with " [stopped]" suffix to DB
 - On done, cache invalidated (not optimistically set) to let React Query refetch the canonical data
+
+**3. Replace Wave 0 test stubs in `ui/src/hooks/useStreamingChat.test.ts` with real unit tests:**
+
+Replace the entire file. The hook's core logic (token accumulation, lifecycle, stop) can be tested by mocking `chatApi.postMessageAndStream` and `@tanstack/react-query`'s `useQueryClient`. Use `renderHook` from `@testing-library/react` (already installed) with a `QueryClientProvider` wrapper:
+
+```typescript
+// @vitest-environment jsdom
+import { describe, it, expect, vi, beforeEach } from "vitest";
+import { renderHook, act } from "@testing-library/react";
+import { QueryClient, QueryClientProvider } from "@tanstack/react-query";
+import { createElement } from "react";
+import { useStreamingChat } from "./useStreamingChat";
+import { chatApi } from "../api/chat";
+
+// Mock chatApi
+vi.mock("../api/chat", () => ({
+  chatApi: {
+    postMessageAndStream: vi.fn(),
+    savePartialMessage: vi.fn().mockResolvedValue({}),
+    postMessage: vi.fn().mockResolvedValue({}),
+  },
+}));
+
+function createWrapper() {
+  const queryClient = new QueryClient({
+    defaultOptions: { queries: { retry: false } },
+  });
+  return ({ children }: { children: React.ReactNode }) =>
+    createElement(QueryClientProvider, { client: queryClient }, children);
+}
+
+describe("useStreamingChat", () => {
+  beforeEach(() => {
+    vi.clearAllMocks();
+  });
+
+  it("accumulates tokens from onToken callbacks into streamingContent", async () => {
+    // Mock postMessageAndStream to capture callbacks and simulate tokens
+    let capturedCallbacks: any;
+    vi.mocked(chatApi.postMessageAndStream).mockImplementation(
+      (_convId, _data, callbacks, _signal) => {
+        capturedCallbacks = callbacks;
+        return Promise.resolve();
+      },
+    );
+
+    const { result } = renderHook(
+      () => useStreamingChat("conv-1"),
+      { wrapper: createWrapper() },
+    );
+
+    // Start stream
+    act(() => {
+      result.current.startStream("hello world");
+    });
+
+    expect(result.current.isStreaming).toBe(true);
+    expect(result.current.streamingContent).toBe("");
+
+    // Simulate tokens arriving
+    act(() => {
+      capturedCallbacks.onToken("Hello ");
+    });
+    expect(result.current.streamingContent).toBe("Hello ");
+
+    act(() => {
+      capturedCallbacks.onToken("world!");
+    });
+    expect(result.current.streamingContent).toBe("Hello world!");
+  });
+
+  it("sets isStreaming=true when stream starts, false on done", async () => {
+    let capturedCallbacks: any;
+    vi.mocked(chatApi.postMessageAndStream).mockImplementation(
+      (_convId, _data, callbacks, _signal) => {
+        capturedCallbacks = callbacks;
+        return Promise.resolve();
+      },
+    );
+
+    const { result } = renderHook(
+      () => useStreamingChat("conv-1"),
+      { wrapper: createWrapper() },
+    );
+
+    expect(result.current.isStreaming).toBe(false);
+
+    act(() => {
+      result.current.startStream("test");
+    });
+    expect(result.current.isStreaming).toBe(true);
+
+    act(() => {
+      capturedCallbacks.onDone("msg-1", "test response");
+    });
+    expect(result.current.isStreaming).toBe(false);
+    expect(result.current.streamingContent).toBe("");
+  });
+
+  it("stop() aborts the controller and sets isStreaming=false", async () => {
+    let capturedSignal: AbortSignal | undefined;
+    vi.mocked(chatApi.postMessageAndStream).mockImplementation(
+      (_convId, _data, _callbacks, signal) => {
+        capturedSignal = signal;
+        return Promise.resolve();
+      },
+    );
+
+    const { result } = renderHook(
+      () => useStreamingChat("conv-1"),
+      { wrapper: createWrapper() },
+    );
+
+    act(() => {
+      result.current.startStream("test");
+    });
+    expect(result.current.isStreaming).toBe(true);
+    expect(capturedSignal?.aborted).toBe(false);
+
+    act(() => {
+      result.current.stop();
+    });
+    expect(result.current.isStreaming).toBe(false);
+    expect(capturedSignal?.aborted).toBe(true);
+  });
+
+  it("handles SSE error by setting isStreaming=false", async () => {
+    let capturedCallbacks: any;
+    vi.mocked(chatApi.postMessageAndStream).mockImplementation(
+      (_convId, _data, callbacks, _signal) => {
+        capturedCallbacks = callbacks;
+        return Promise.resolve();
+      },
+    );
+
+    const { result } = renderHook(
+      () => useStreamingChat("conv-1"),
+      { wrapper: createWrapper() },
+    );
+
+    act(() => {
+      result.current.startStream("test");
+    });
+    expect(result.current.isStreaming).toBe(true);
+
+    act(() => {
+      capturedCallbacks.onError("Stream error");
+    });
+    expect(result.current.isStreaming).toBe(false);
+  });
+
+  it("does nothing when conversationId is null", () => {
+    const { result } = renderHook(
+      () => useStreamingChat(null),
+      { wrapper: createWrapper() },
+    );
+
+    act(() => {
+      result.current.startStream("test");
+    });
+    expect(chatApi.postMessageAndStream).not.toHaveBeenCalled();
+    expect(result.current.isStreaming).toBe(false);
+  });
+});
+```
+
+IMPORTANT: This replaces ALL `it.todo()` stubs with real tests. After this task runs, `useStreamingChat.test.ts` must have zero `it.todo()` entries.
  </action>
  <verify>
-    <automated>cd /opt/nexus && pnpm --filter @paperclipai/ui exec -- tsc --noEmit 2>&1 | head -20</automated>
+    <automated>cd /opt/nexus && pnpm --filter @paperclipai/ui vitest run src/hooks/useStreamingChat.test.ts --reporter=verbose 2>&1 | tail -30</automated>
  </verify>
  <acceptance_criteria>
    - grep -q "useStreamingChat" ui/src/hooks/useStreamingChat.ts
@ -443,6 +622,8 @@ Key design decisions:
    - grep -q "\\[stopped\\]" ui/src/hooks/useStreamingChat.ts
    - grep -q "savePartialMessage" ui/src/api/chat.ts
    - grep -q "ReadableStream\\|getReader" ui/src/api/chat.ts
+    - NOT grep -q "it.todo" ui/src/hooks/useStreamingChat.test.ts (all stubs replaced with real tests)
+    - vitest reports 5 passing tests in useStreamingChat.test.ts
  </acceptance_criteria>
  <done>
    - useStreamingChat hook exists with startStream, stop, streamingContent, isStreaming
@ -451,6 +632,8 @@ Key design decisions:
    - startTransition used for token accumulation (PERF-02)
    - AbortController used for stop functionality (CHAT-12)
    - Partial message saved with " [stopped]" suffix on stop
+    - Wave 0 test stubs REPLACED with 5 real unit tests covering: token accumulation, isStreaming lifecycle, stop() abort, error handling, null conversationId guard
+    - All tests pass (no it.todo remaining)
    - UI TypeScript compiles clean
  </done>
 </task>
@ -460,8 +643,10 @@ Key design decisions:
 <verification>
 - `pnpm --filter @paperclipai/ui exec -- tsc --noEmit` passes
 - `pnpm --filter @paperclipai/server exec -- tsc --noEmit` passes (or pre-existing non-chat errors only)
+- `pnpm --filter @paperclipai/ui vitest run src/hooks/useStreamingChat.test.ts` passes with 5 real tests (zero todos)
 - Server routes include stream, edit, truncate endpoints
 - Client hook manages full SSE lifecycle
+- PERF-02 verified: flushHeaders position precedes for-await in chat.ts
 </verification>

 <success_criteria>
@ -469,6 +654,7 @@ Key design decisions:
 - Stop generation aborts the connection and saves partial content (CHAT-12)
 - SSE headers flushed before generation begins (PERF-02)
 - Edit and truncate server endpoints ready for Plan 03 UI
+- useStreamingChat has real passing unit tests (not stubs)
 </success_criteria>

 <output>
--- a/.planning/phases/22-agent-streaming/22-05-PLAN.md
+++ b/.planning/phases/22-agent-streaming/22-05-PLAN.md
@ -211,6 +211,16 @@ async truncateMessagesAfter(conversationId: string, messageId: string) {
 },
 ```

+Also add a `deleteMessage` method for retry (needed to delete the assistant message itself):
+```typescript
+async deleteMessage(conversationId: string, messageId: string) {
+  await fetch(`/api/conversations/${conversationId}/messages/${messageId}`, {
+    method: "DELETE",
+    credentials: "include",
+  });
+},
+```
+
 **2. Rewrite `ui/src/components/ChatMessageList.tsx` with virtualizer:**

 Replace the entire file with a virtualized implementation:
@ -441,7 +451,7 @@ describe("ChatMessageList", () => {
    - virtualizer.measure() called on streaming content change
    - Jump-to-bottom button appears when scrolled >200px from bottom
    - 3 loading skeletons shown during load
-    - chatApi has editMessage and truncateMessagesAfter methods
+    - chatApi has editMessage, truncateMessagesAfter, and deleteMessage methods
    - TypeScript compiles clean
  </done>
 </task>
@ -459,6 +469,7 @@ describe("ChatMessageList", () => {
    - ui/src/components/ChatMentionPopover.tsx
    - ui/src/lib/slash-commands.ts
    - ui/src/api/agents.ts
+    - ui/src/hooks/useChatMessages.ts
  </read_first>
  <files>
    ui/src/components/ChatPanel.tsx,
@ -579,7 +590,7 @@ export function ChatPanel() {
  const [isSending, setIsSending] = useState(false);
  const [activeAgentId, setActiveAgentId] = useState<string | null>(null);

-  const { sendMutation } = useChatMessages(activeConversationId);
+  const { messages } = useChatMessages(activeConversationId);
  const { streamingContent, isStreaming, startStream, stop } = useStreamingChat(activeConversationId);

  // Load agents for routing and identity
@ -610,7 +621,7 @@ export function ChatPanel() {
    setIsSending(true);
    try {
      if (!activeConversationId) {
-        // Path 1: No active conversation — create one, post user message, then stream
+        // Path 1: No active conversation -- create one, post user message, then stream
        const newConvo = await chatApi.createConversation(selectedCompanyId, {
          agentId: resolvedAgentId ?? undefined,
        });
@ -620,7 +631,7 @@ export function ChatPanel() {
        // Note: streaming starts on next render when activeConversationId is set
        // For now, the echo stream will be triggered by the new conversation
      } else {
-        // Path 2: Active conversation — post user message then stream
+        // Path 2: Active conversation -- post user message then stream
        await chatApi.postMessage(activeConversationId, { role: "user", content });
        queryClient.invalidateQueries({ queryKey: ["chat", "messages", activeConversationId] });
        startStream(content, resolvedAgentId ?? undefined);
@ -639,17 +650,43 @@ export function ChatPanel() {
    startStream(newContent, activeAgentId ?? undefined);
  };

-  // Retry handler: truncate from the assistant message onward, re-stream the previous user message
-  const handleRetry = async (messageId: string) => {
-    if (!activeConversationId) return;
-    // Truncate the assistant message and everything after
-    await chatApi.truncateMessagesAfter(activeConversationId, messageId);
-    // Also delete the message itself
-    // For retry, we re-stream using the last user message content
+  // Retry handler: find the last user message before the assistant message,
+  // delete the assistant message and everything after it, then re-stream
+  // with the actual prior user message content (not hardcoded text).
+  const handleRetry = async (assistantMessageId: string) => {
+    if (!activeConversationId || !messages) return;
+
+    // Find the assistant message index in the messages array
+    const assistantIdx = messages.findIndex((m) => m.id === assistantMessageId);
+    if (assistantIdx < 0) return;
+
+    // Find the last user message before this assistant message
+    let lastUserContent = "";
+    for (let i = assistantIdx - 1; i >= 0; i--) {
+      if (messages[i]!.role === "user") {
+        lastUserContent = messages[i]!.content;
+        break;
+      }
+    }
+    if (!lastUserContent) return; // No prior user message found; nothing to retry
+
+    // Truncate messages after the user message (this deletes the assistant msg + everything after)
+    // First, find the user message to truncate after
+    let userMessageId = "";
+    for (let i = assistantIdx - 1; i >= 0; i--) {
+      if (messages[i]!.role === "user") {
+        userMessageId = messages[i]!.id;
+        break;
+      }
+    }
+    if (!userMessageId) return;
+
+    // Delete everything after the user message (includes the assistant message itself)
+    await chatApi.truncateMessagesAfter(activeConversationId, userMessageId);
    queryClient.invalidateQueries({ queryKey: ["chat", "messages", activeConversationId] });
-    // The last user message is the one before the deleted assistant message
-    // Re-trigger stream with empty content (server echo will use whatever was sent)
-    startStream("Regenerate this response", activeAgentId ?? undefined);
+
+    // Re-stream using the actual user message content
+    startStream(lastUserContent, activeAgentId ?? undefined);
  };

  return (
@ -747,8 +784,8 @@ Key integration points:
 - `ChatStopButton` shown conditionally when `isStreaming`
 - `ChatInput` receives `agents` for mention popover, `disabled` during streaming, custom placeholder
 - `ChatMessageList` receives streaming props and agentMap for identity bars
- `handleEdit` calls editMessage + truncateMessagesAfter + startStream
- `handleRetry` calls truncateMessagesAfter + startStream
+- `handleEdit` calls editMessage + truncateMessagesAfter + startStream with edited content
+- `handleRetry` finds the ACTUAL prior user message content (not hardcoded text), truncates from that user message onward (which deletes the assistant message), and re-streams with the real user message
 - `resolveAgentFromContent` determines which agent receives the message
 - `ScrollArea` replaced by virtualizer's own scroll container in ChatMessageList
  </action>
@ -769,14 +806,16 @@ Key integration points:
    - grep -q "slashOpen" ui/src/components/ChatInput.tsx
    - grep -q "mentionOpen" ui/src/components/ChatInput.tsx
    - grep -q "placeholder" ui/src/components/ChatInput.tsx
+    - grep -q "lastUserContent" ui/src/components/ChatPanel.tsx (retry uses actual user message)
+    - NOT grep -q "Regenerate this response" ui/src/components/ChatPanel.tsx (no hardcoded retry text)
  </acceptance_criteria>
  <done>
    - ChatPanel integrates: useStreamingChat, ChatAgentSelector, ChatStopButton, agent routing, edit/retry handlers
    - ChatInput has slash command popover (triggered by / at start) and @mention popover (triggered by @)
    - Streaming content passed to ChatMessageList as synthetic entry
    - Agent identity resolved from agentMap for message identity bars
-    - Edit handler: editMessage + truncateMessagesAfter + re-stream
-    - Retry handler: truncateMessagesAfter + re-stream
+    - Edit handler: editMessage + truncateMessagesAfter + re-stream with edited content
+    - Retry handler: looks up actual last user message content, truncates from user message onward (deleting the assistant message), re-streams with real user content
    - Input disabled during streaming with "Waiting for response..." placeholder
    - Stop button appears during streaming
    - Agent selector in header for per-conversation agent switching
@ -788,24 +827,27 @@ Key integration points:
  <name>Task 3: Verify complete Phase 22 feature set</name>
  <what-built>Complete Phase 22 agent streaming feature: SSE streaming with echo stub, agent selector, message identity bars with role colors, edit/retry/stop controls, slash commands, @mentions, and virtualized message list.</what-built>
  <how-to-verify>
-    1. Start the dev server: `pnpm dev`
-    2. Open the chat panel (click chat icon in sidebar)
-    3. Send a message — verify tokens stream in word-by-word (echo stub)
-    4. During streaming, verify the blinking cursor appears at the end
-    5. Click "Stop generating" during a stream — verify partial message saved with [stopped] suffix
-    6. Hover a user message — verify edit pencil appears; click it, edit, save — verify response regenerates
-    7. Hover an assistant message — verify retry button appears; click — verify regeneration
-    8. Use the agent selector in the header to switch agents
-    9. Type `/` at start of input — verify slash command popover opens; select `/ask-pm`
-    10. Type `@` in input — verify agent mention popover opens
-    11. Verify agent name and colored icon appear above assistant messages
-    12. Switch between all 3 themes — verify agent colors remain distinguishable
-    13. Load a conversation with many messages — verify smooth scrolling (virtualized)
+    All 9 requirements (PERF-03, CHAT-01, CHAT-08, CHAT-10, CHAT-11, CHAT-12, INPUT-05, INPUT-06, PERF-02) must be individually exercised:
+
+    1. **CHAT-01** (streaming): Send a message -- verify tokens stream in word-by-word (echo stub)
+    2. **PERF-02** (latency): During streaming, verify the blinking cursor appears at the end promptly (sub-100ms first token from echo stub)
+    3. **CHAT-12** (stop): Click "Stop generating" during a stream -- verify partial message saved with [stopped] suffix
+    4. **CHAT-10** (edit): Hover a user message -- verify edit pencil appears; click it, edit, save -- verify response regenerates with new content
+    5. **CHAT-11** (retry): Hover an assistant message -- verify retry button appears; click -- verify it regenerates using the PRIOR user message (not hardcoded text)
+    6. **CHAT-08** (agent selector): Use the agent selector in the header to switch agents; verify new messages are attributed to the selected agent
+    7. **INPUT-05** (slash commands): Type `/` at start of input -- verify slash command popover opens; select `/ask-pm`; verify the command routes to PM agent
+    8. **INPUT-06** (@mention): Type `@` in input -- verify agent mention popover opens; select an agent; verify routing
+    9. **PERF-03** (virtualization): Load a conversation with many messages -- verify smooth scrolling (check DOM has limited rendered nodes via DevTools)
+
+    Additional visual checks:
+    10. Verify agent name and colored icon appear above assistant messages (AGENT-04)
+    11. Switch between all 3 themes -- verify agent colors remain distinguishable (THEME-03)
+    12. Verify all 11 agent roles show distinct colors (no two roles share the same color)
  </how-to-verify>
  <resume-signal>Type "approved" or describe issues</resume-signal>
-  <action>Human verification of the complete Phase 22 feature set. Follow the how-to-verify steps above.</action>
+  <action>Human verification of the complete Phase 22 feature set. Follow the how-to-verify steps above, testing each of the 9 requirements individually.</action>
  <verify><automated>pnpm --filter @paperclipai/ui vitest run --reporter=verbose</automated></verify>
-  <done>All 13 verification steps pass visual/functional inspection</done>
+  <done>All 12 verification steps pass visual/functional inspection, with each of the 9 requirements individually confirmed</done>
 </task>

 </tasks>
@ -820,7 +862,7 @@ Key integration points:
 - Tokens stream from server to client in real time (CHAT-01, PERF-02)
 - Agent selector allows switching active agent (CHAT-08)
 - Edit previous message triggers regeneration (CHAT-10)
- Retry button regenerates assistant response (CHAT-11)
+- Retry button regenerates assistant response using actual prior user message (CHAT-11)
 - Stop button cancels streaming and preserves partial content (CHAT-12)
 - Slash commands route to correct agent (INPUT-05)
 - @mentions route to named agent (INPUT-06)
--- a/.planning/phases/22-agent-streaming/22-VALIDATION.md
+++ b/.planning/phases/22-agent-streaming/22-VALIDATION.md
@ -2,8 +2,8 @@
 phase: 22
 slug: agent-streaming
 status: draft
-nyquist_compliant: false
-wave_0_complete: false
+nyquist_compliant: true
+wave_0_complete: true
 created: 2026-04-01
 ---

@ -40,13 +40,17 @@ created: 2026-04-01

 | Task ID | Plan | Wave | Requirement | Test Type | Automated Command | File Exists | Status |
 |---------|------|------|-------------|-----------|-------------------|-------------|--------|
-| 22-00-01 | 00 | 0 | (scaffolds) | stub | `pnpm --filter @paperclipai/ui vitest run` | Created in W0 | pending |
-| 22-01-01 | 01 | 1 | CHAT-01, CHAT-12 | unit | `pnpm --filter @paperclipai/ui vitest run src/hooks/useStreamingChat.test.ts` | Wave 0 | pending |
+| 22-00-01 | 00 | 0 | THEME-03 | unit | `pnpm --filter @paperclipai/ui vitest run src/lib/agent-role-colors.test.ts` | Created in W0 | pending |
+| 22-00-02 | 00 | 0 | (scaffolds) | stub | `pnpm --filter @paperclipai/ui vitest run` | Created in W0 | pending |
+| 22-01-01 | 01 | 1 | PERF-02 | unit+grep | `tsc --noEmit` + flushHeaders position check | N/A | pending |
+| 22-01-02 | 01 | 1 | CHAT-01, CHAT-12 | unit | `pnpm --filter @paperclipai/ui vitest run src/hooks/useStreamingChat.test.ts` | Wave 0 (stubs replaced with real tests in 01-02) | pending |
 | 22-02-01 | 02 | 1 | AGENT-04, THEME-03 | unit | `pnpm --filter @paperclipai/ui vitest run src/components/ChatMessageIdentityBar.test.tsx` | Wave 0 | pending |
-| 22-03-01 | 03 | 2 | CHAT-08 | unit | `pnpm --filter @paperclipai/ui vitest run src/components/ChatAgentSelector.test.tsx` | Wave 0 | pending |
-| 22-04-01 | 04 | 2 | CHAT-10, CHAT-11 | unit | `pnpm --filter @paperclipai/ui vitest run src/components/ChatMessage.test.tsx` | Wave 0 | pending |
-| 22-05-01 | 05 | 2 | INPUT-05, INPUT-06 | unit | `pnpm --filter @paperclipai/ui vitest run src/components/ChatSlashCommandPopover.test.tsx` | Wave 0 | pending |
-| 22-06-01 | 06 | 3 | PERF-02, PERF-03 | unit+manual | `pnpm --filter @paperclipai/ui vitest run src/components/ChatMessageList.test.tsx` | Wave 0 | pending |
+| 22-02-02 | 02 | 1 | CHAT-08 | unit | `pnpm --filter @paperclipai/ui vitest run src/components/ChatAgentSelector.test.tsx` | Wave 0 | pending |
+| 22-03-01 | 03 | 2 | CHAT-10, CHAT-11, CHAT-12 | unit | `pnpm --filter @paperclipai/ui vitest run src/components/ChatMessage.test.tsx` | Wave 0 | pending |
+| 22-04-01 | 04 | 2 | INPUT-05 | unit | `pnpm --filter @paperclipai/ui vitest run src/components/ChatSlashCommandPopover.test.tsx` | Wave 0 | pending |
+| 22-04-02 | 04 | 2 | INPUT-06 | unit | `pnpm --filter @paperclipai/ui vitest run src/components/ChatMentionPopover.test.tsx` | Wave 0 | pending |
+| 22-05-01 | 05 | 3 | PERF-03 | unit | `pnpm --filter @paperclipai/ui vitest run src/components/ChatMessageList.test.tsx` | Wave 0 | pending |
+| 22-05-02 | 05 | 3 | PERF-02, CHAT-01, CHAT-08, CHAT-10, CHAT-11, CHAT-12, INPUT-05, INPUT-06 | tsc+manual | `tsc --noEmit` + human verify checkpoint | N/A | pending |

 *Status: pending / green / red / flaky*

@ -54,14 +58,14 @@ created: 2026-04-01

 ## Wave 0 Requirements

- [ ] `ui/src/hooks/useStreamingChat.test.ts` — covers CHAT-01, CHAT-12 streaming hook
- [ ] `ui/src/components/ChatAgentSelector.test.tsx` — covers CHAT-08 agent selection
- [ ] `ui/src/components/ChatMessage.test.tsx` — covers CHAT-10, CHAT-11 edit/retry
- [ ] `ui/src/components/ChatSlashCommandPopover.test.tsx` — covers INPUT-05 slash commands
- [ ] `ui/src/components/ChatMentionPopover.test.tsx` — covers INPUT-06 @mention
- [ ] `ui/src/components/ChatMessageIdentityBar.test.tsx` — covers AGENT-04 identity
- [ ] `ui/src/lib/agent-role-colors.test.ts` — covers THEME-03 agent colors
- [ ] `ui/src/components/ChatMessageList.test.tsx` — covers PERF-03 virtualization
+- [x] `ui/src/lib/agent-role-colors.test.ts` — covers THEME-03 agent colors (real test with uniqueness check)
+- [x] `ui/src/hooks/useStreamingChat.test.ts` — covers CHAT-01, CHAT-12 streaming hook (stubs; replaced with real tests in Plan 01)
+- [x] `ui/src/components/ChatAgentSelector.test.tsx` — covers CHAT-08 agent selection
+- [x] `ui/src/components/ChatMessage.test.tsx` — covers CHAT-10, CHAT-11 edit/retry
+- [x] `ui/src/components/ChatSlashCommandPopover.test.tsx` — covers INPUT-05 slash commands
+- [x] `ui/src/components/ChatMentionPopover.test.tsx` — covers INPUT-06 @mention
+- [x] `ui/src/components/ChatMessageIdentityBar.test.tsx` — covers AGENT-04 identity
+- [x] `ui/src/components/ChatMessageList.test.tsx` — covers PERF-03 virtualization

 ---

@ -72,16 +76,17 @@ created: 2026-04-01
 | First token under 500ms | PERF-02 | Timing depends on LLM response | Open chat, send message, measure time to first token appearance |
 | Agent colors distinguishable across themes | THEME-03 | Visual distinction | Switch between all 3 themes, verify agent name colors are readable |
 | 1,000+ messages scroll without jank | PERF-03 | Performance testing | Load a conversation with 1,000+ messages, scroll rapidly |
+| Retry uses actual prior user message | CHAT-11 | Interaction flow | Click retry on assistant message, verify the regenerated response matches original user input |

 ---

 ## Validation Sign-Off

- [ ] All tasks have `<automated>` verify or Wave 0 dependencies
- [ ] Sampling continuity: no 3 consecutive tasks without automated verify
- [ ] Wave 0 covers all MISSING references
- [ ] No watch-mode flags
- [ ] Feedback latency < 20s
- [ ] `nyquist_compliant: true` set in frontmatter
+- [x] All tasks have `<automated>` verify or Wave 0 dependencies
+- [x] Sampling continuity: no 3 consecutive tasks without automated verify
+- [x] Wave 0 covers all MISSING references
+- [x] No watch-mode flags
+- [x] Feedback latency < 20s
+- [x] `nyquist_compliant: true` set in frontmatter

-**Approval:** pending
+**Approval:** approved