Skip to content

Commit f0c2017

Browse files
committed
🤖 feat: add robust Electron E2E tests for regression prevention
Add comprehensive E2E tests covering window lifecycle, IPC robustness, streaming edge cases, persistence, and error display. These tests target recent regression patterns including:
- MockBrowserWindow.isDestroyed() issues
- IPC send to destroyed window race conditions
- Duplicate IPC handler registration on window recreate
- Error state display and recovery

New test files:
- windowLifecycle.spec.ts: window operations, IPC stability
- ipcRobustness.spec.ts: concurrent IPC calls, state corruption
- streamEdgeCases.spec.ts: streaming during UI operations, errors
- persistence.spec.ts: chat history, settings, mode persistence
- errorDisplay.spec.ts: error messages, recovery flows

Infrastructure changes:
- Add error mock scenarios (rate limit, server, network errors)
- Update stream timeline capture to handle stream-error events
- CI matrix: Linux (comprehensive) + macOS (window lifecycle only)

_Generated with `mux`_
1 parent 3b530f7 commit f0c2017

File tree

9 files changed

+689
-5
lines changed

9 files changed

+689
-5
lines changed

.github/workflows/ci.yml

Lines changed: 22 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -148,9 +148,21 @@ jobs:
148148
run: make test-storybook
149149

150150
e2e-test:
151-
name: End-to-End Tests
152-
runs-on: ${{ github.repository_owner == 'coder' && 'depot-ubuntu-22.04-16' || 'ubuntu-latest' }}
151+
name: E2E Tests (${{ matrix.os }})
153152
if: github.event.inputs.test_filter == ''
153+
strategy:
154+
fail-fast: false
155+
matrix:
156+
include:
157+
# Linux: comprehensive E2E tests
158+
- os: linux
159+
runner: ${{ github.repository_owner == 'coder' && 'depot-ubuntu-22.04-16' || 'ubuntu-latest' }}
160+
test_scope: "all"
161+
# macOS: window lifecycle and platform-dependent tests only
162+
- os: macos
163+
runner: macos-latest
164+
test_scope: "window-lifecycle"
165+
runs-on: ${{ matrix.runner }}
154166
steps:
155167
- name: Checkout code
156168
uses: actions/checkout@v4
@@ -159,18 +171,24 @@ jobs:
159171

160172
- uses: ./.github/actions/setup-mux
161173

162-
- name: Install xvfb
174+
- name: Install xvfb (Linux)
175+
if: matrix.os == 'linux'
163176
run: |
164177
sudo apt-get update
165178
sudo apt-get install -y xvfb
166179
167180
- uses: ./.github/actions/setup-playwright
168181

169-
- name: Run e2e tests
182+
- name: Run comprehensive e2e tests (Linux)
183+
if: matrix.os == 'linux'
170184
run: xvfb-run -a make test-e2e
171185
env:
172186
ELECTRON_DISABLE_SANDBOX: 1
173187

188+
- name: Run window lifecycle e2e tests (macOS)
189+
if: matrix.os == 'macos'
190+
run: make test-e2e PLAYWRIGHT_ARGS="tests/e2e/scenarios/windowLifecycle.spec.ts"
191+
174192
docker-smoke-test:
175193
name: Docker Smoke Test
176194
runs-on: ${{ github.repository_owner == 'coder' && 'depot-ubuntu-22.04-16' || 'ubuntu-latest' }}

src/node/services/mock/scenarios.ts

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -3,6 +3,7 @@ import * as review from "./scenarios/review";
33
import * as toolFlows from "./scenarios/toolFlows";
44
import * as slashCommands from "./scenarios/slashCommands";
55
import * as permissionModes from "./scenarios/permissionModes";
6+
import * as errorScenarios from "./scenarios/errorScenarios";
67
import type { ScenarioTurn } from "./scenarioTypes";
78

89
export const allScenarios: ScenarioTurn[] = [
@@ -11,4 +12,5 @@ export const allScenarios: ScenarioTurn[] = [
1112
...toolFlows.scenarios,
1213
...slashCommands.scenarios,
1314
...permissionModes.scenarios,
15+
...errorScenarios.scenarios,
1416
];
Lines changed: 91 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,91 @@
1+
import type { ScenarioTurn } from "@/node/services/mock/scenarioTypes";
2+
import { STREAM_BASE_DELAY } from "@/node/services/mock/scenarioTypes";
3+
import { KNOWN_MODELS } from "@/common/constants/knownModels";
4+
5+
export const ERROR_PROMPTS = {
6+
TRIGGER_RATE_LIMIT: "Trigger rate limit error",
7+
TRIGGER_API_ERROR: "Trigger API error",
8+
TRIGGER_NETWORK_ERROR: "Trigger network error",
9+
} as const;
10+
11+
const rateLimitErrorTurn: ScenarioTurn = {
12+
user: {
13+
text: ERROR_PROMPTS.TRIGGER_RATE_LIMIT,
14+
thinkingLevel: "low",
15+
mode: "exec",
16+
},
17+
assistant: {
18+
messageId: "msg-error-ratelimit",
19+
events: [
20+
{
21+
kind: "stream-start",
22+
delay: 0,
23+
messageId: "msg-error-ratelimit",
24+
model: KNOWN_MODELS.GPT.id,
25+
},
26+
{
27+
kind: "stream-delta",
28+
delay: STREAM_BASE_DELAY,
29+
text: "Processing your request...",
30+
},
31+
{
32+
kind: "stream-error",
33+
delay: STREAM_BASE_DELAY * 2,
34+
error: "Rate limit exceeded. Please retry after 60 seconds.",
35+
errorType: "rate_limit",
36+
},
37+
],
38+
},
39+
};
40+
41+
const apiErrorTurn: ScenarioTurn = {
42+
user: {
43+
text: ERROR_PROMPTS.TRIGGER_API_ERROR,
44+
thinkingLevel: "low",
45+
mode: "exec",
46+
},
47+
assistant: {
48+
messageId: "msg-error-api",
49+
events: [
50+
{
51+
kind: "stream-start",
52+
delay: 0,
53+
messageId: "msg-error-api",
54+
model: KNOWN_MODELS.GPT.id,
55+
},
56+
{
57+
kind: "stream-error",
58+
delay: STREAM_BASE_DELAY,
59+
error: "Internal server error occurred while processing the request.",
60+
errorType: "server_error",
61+
},
62+
],
63+
},
64+
};
65+
66+
const networkErrorTurn: ScenarioTurn = {
67+
user: {
68+
text: ERROR_PROMPTS.TRIGGER_NETWORK_ERROR,
69+
thinkingLevel: "low",
70+
mode: "exec",
71+
},
72+
assistant: {
73+
messageId: "msg-error-network",
74+
events: [
75+
{
76+
kind: "stream-start",
77+
delay: 0,
78+
messageId: "msg-error-network",
79+
model: KNOWN_MODELS.GPT.id,
80+
},
81+
{
82+
kind: "stream-error",
83+
delay: STREAM_BASE_DELAY,
84+
error: "Network connection lost. Please check your internet connection.",
85+
errorType: "network",
86+
},
87+
],
88+
},
89+
};
90+
91+
export const scenarios: ScenarioTurn[] = [rateLimitErrorTurn, apiErrorTurn, networkErrorTurn];
Lines changed: 126 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,126 @@
1+
import { electronTest as test, electronExpect as expect } from "../electronTest";
2+
import { ERROR_PROMPTS } from "@/node/services/mock/scenarios/errorScenarios";
3+
import { LIST_PROGRAMMING_LANGUAGES } from "@/node/services/mock/scenarios/basicChat";
4+
5+
test.skip(
6+
({ browserName }) => browserName !== "chromium",
7+
"Electron scenario runs on chromium only"
8+
);
9+
10+
test.describe("error display", () => {
11+
test("rate limit error shows in transcript with message", async ({ ui, page }) => {
12+
await ui.projects.openFirstWorkspace();
13+
await ui.chat.setMode("Exec");
14+
15+
await ui.chat.captureStreamTimeline(async () => {
16+
await ui.chat.sendMessage(ERROR_PROMPTS.TRIGGER_RATE_LIMIT);
17+
});
18+
19+
// Error message should be visible in the transcript
20+
const transcript = page.getByRole("log", { name: "Conversation transcript" });
21+
await expect(transcript).toBeVisible();
22+
23+
// Should show the rate limit error text
24+
await expect(
25+
transcript.getByText("Rate limit exceeded. Please retry after 60 seconds.")
26+
).toBeVisible();
27+
});
28+
29+
test("server error shows in transcript", async ({ ui, page }) => {
30+
await ui.projects.openFirstWorkspace();
31+
await ui.chat.setMode("Exec");
32+
33+
await ui.chat.captureStreamTimeline(async () => {
34+
await ui.chat.sendMessage(ERROR_PROMPTS.TRIGGER_API_ERROR);
35+
});
36+
37+
const transcript = page.getByRole("log", { name: "Conversation transcript" });
38+
await expect(
39+
transcript.getByText("Internal server error occurred while processing the request.")
40+
).toBeVisible();
41+
});
42+
43+
test("network error shows in transcript", async ({ ui, page }) => {
44+
await ui.projects.openFirstWorkspace();
45+
await ui.chat.setMode("Exec");
46+
47+
await ui.chat.captureStreamTimeline(async () => {
48+
await ui.chat.sendMessage(ERROR_PROMPTS.TRIGGER_NETWORK_ERROR);
49+
});
50+
51+
const transcript = page.getByRole("log", { name: "Conversation transcript" });
52+
await expect(
53+
transcript.getByText("Network connection lost. Please check your internet connection.")
54+
).toBeVisible();
55+
});
56+
57+
test("app remains functional after error", async ({ ui, page }) => {
58+
await ui.projects.openFirstWorkspace();
59+
await ui.chat.setMode("Exec");
60+
61+
// Trigger an error
62+
await ui.chat.captureStreamTimeline(async () => {
63+
await ui.chat.sendMessage(ERROR_PROMPTS.TRIGGER_API_ERROR);
64+
});
65+
66+
// Verify app is still functional - can open settings
67+
await ui.settings.open();
68+
await ui.settings.expectOpen();
69+
await ui.settings.close();
70+
71+
// Chat input should still be usable
72+
const chatInput = page.getByRole("textbox", { name: /message/i });
73+
await expect(chatInput).toBeVisible();
74+
await expect(chatInput).toBeEnabled();
75+
});
76+
77+
test("multiple errors don't crash app", async ({ ui, page }) => {
78+
await ui.projects.openFirstWorkspace();
79+
await ui.chat.setMode("Exec");
80+
81+
// Trigger multiple errors in sequence
82+
await ui.chat.captureStreamTimeline(async () => {
83+
await ui.chat.sendMessage(ERROR_PROMPTS.TRIGGER_RATE_LIMIT);
84+
});
85+
86+
await ui.chat.captureStreamTimeline(async () => {
87+
await ui.chat.sendMessage(ERROR_PROMPTS.TRIGGER_API_ERROR);
88+
});
89+
90+
await ui.chat.captureStreamTimeline(async () => {
91+
await ui.chat.sendMessage(ERROR_PROMPTS.TRIGGER_NETWORK_ERROR);
92+
});
93+
94+
// App should still be responsive
95+
await expect(page.getByRole("navigation", { name: "Projects" })).toBeVisible();
96+
97+
// Can still send a normal message after errors
98+
await ui.chat.setMode("Plan");
99+
const timeline = await ui.chat.captureStreamTimeline(async () => {
100+
await ui.chat.sendMessage(LIST_PROGRAMMING_LANGUAGES);
101+
});
102+
103+
expect(timeline.events.some((e) => e.type === "stream-end")).toBe(true);
104+
});
105+
106+
test("error state clears on successful message", async ({ ui }) => {
107+
await ui.projects.openFirstWorkspace();
108+
await ui.chat.setMode("Exec");
109+
110+
// Trigger an error first
111+
const errorTimeline = await ui.chat.captureStreamTimeline(async () => {
112+
await ui.chat.sendMessage(ERROR_PROMPTS.TRIGGER_API_ERROR);
113+
});
114+
expect(errorTimeline.events.some((e) => e.type === "stream-error")).toBe(true);
115+
116+
// Send a successful message
117+
await ui.chat.setMode("Plan");
118+
const successTimeline = await ui.chat.captureStreamTimeline(async () => {
119+
await ui.chat.sendMessage(LIST_PROGRAMMING_LANGUAGES);
120+
});
121+
122+
// Should complete successfully
123+
expect(successTimeline.events.some((e) => e.type === "stream-end")).toBe(true);
124+
await ui.chat.expectTranscriptContains("Python");
125+
});
126+
});
Lines changed: 88 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,88 @@
1+
import { electronTest as test, electronExpect as expect } from "../electronTest";
2+
import { LIST_PROGRAMMING_LANGUAGES } from "@/node/services/mock/scenarios/basicChat";
3+
4+
test.skip(
5+
({ browserName }) => browserName !== "chromium",
6+
"Electron scenario runs on chromium only"
7+
);
8+
9+
test.describe("IPC robustness", () => {
10+
test("IPC calls during stream don't race", async ({ ui, page }) => {
11+
await ui.projects.openFirstWorkspace();
12+
13+
// First, send a message and wait for it to complete
14+
const timeline = await ui.chat.captureStreamTimeline(async () => {
15+
await ui.chat.sendMessage(LIST_PROGRAMMING_LANGUAGES);
16+
});
17+
18+
expect(timeline.events.length).toBeGreaterThan(0);
19+
expect(timeline.events[timeline.events.length - 1]?.type).toBe("stream-end");
20+
21+
// Now trigger IPC calls by opening/closing settings rapidly
22+
await ui.settings.open();
23+
await ui.settings.close();
24+
await ui.settings.open();
25+
await ui.settings.close();
26+
27+
// Verify app is still responsive and transcript preserved
28+
await ui.chat.expectTranscriptContains("Python");
29+
});
30+
31+
test("concurrent IPC calls resolve correctly", async ({ ui, page }) => {
32+
await ui.projects.openFirstWorkspace();
33+
34+
// Trigger multiple UI operations that involve IPC
35+
await ui.settings.open();
36+
await ui.settings.selectSection("Providers");
37+
await ui.settings.selectSection("Models");
38+
await ui.settings.close();
39+
40+
// Immediately try to send a message
41+
const timeline = await ui.chat.captureStreamTimeline(async () => {
42+
await ui.chat.sendMessage(LIST_PROGRAMMING_LANGUAGES);
43+
});
44+
45+
expect(timeline.events.length).toBeGreaterThan(0);
46+
await ui.chat.expectTranscriptContains("JavaScript");
47+
});
48+
49+
test("rapid workspace interactions don't corrupt state", async ({ ui }) => {
50+
await ui.projects.openFirstWorkspace();
51+
52+
// Send a message
53+
await ui.chat.captureStreamTimeline(async () => {
54+
await ui.chat.sendMessage(LIST_PROGRAMMING_LANGUAGES);
55+
});
56+
57+
// Toggle mode rapidly - this exercises IPC without starting new streams
58+
await ui.chat.setMode("Exec");
59+
await ui.chat.setMode("Plan");
60+
61+
// Should still show previous messages after mode switching
62+
await ui.chat.expectTranscriptContains("Python");
63+
await ui.chat.expectTranscriptContains("JavaScript");
64+
await ui.chat.expectTranscriptContains("Rust");
65+
});
66+
67+
test("settings changes during chat don't cause errors", async ({ ui, page }) => {
68+
await ui.projects.openFirstWorkspace();
69+
70+
// Open settings
71+
await ui.settings.open();
72+
73+
// Navigate around settings
74+
await ui.settings.selectSection("Providers");
75+
await ui.settings.selectSection("General");
76+
77+
// Close settings
78+
await ui.settings.close();
79+
80+
// Send a message - should work normally
81+
const timeline = await ui.chat.captureStreamTimeline(async () => {
82+
await ui.chat.sendMessage(LIST_PROGRAMMING_LANGUAGES);
83+
});
84+
85+
expect(timeline.events.length).toBeGreaterThan(0);
86+
expect(timeline.events.some((e) => e.type === "stream-end")).toBe(true);
87+
});
88+
});

0 commit comments

Comments (0)