stacklok
diff --git a/‎common/app-info.ts‎
Lines changed: 0 additions & 3 deletions b/‎common/app-info.ts‎
Lines changed: 0 additions & 3 deletions
diff --git a/‎e2e-tests/helpers/app-relaunch.ts‎
Lines changed: 173 additions & 0 deletions b/‎e2e-tests/helpers/app-relaunch.ts‎
Lines changed: 173 additions & 0 deletions
diff --git a/‎e2e-tests/mcp-optimizer-startup-cleanup.spec.ts‎
Lines changed: 186 additions & 0 deletions b/‎e2e-tests/mcp-optimizer-startup-cleanup.spec.ts‎
Lines changed: 186 additions & 0 deletions
@@ -49,14 +49,11 @@ export const GITHUB_PAGES_MANIFEST_URL =
 export const DOCS_BASE_URL = 'https://docs.stacklok.com/toolhive'
 export const DISCORD_URL = 'https://discord.gg/stacklok'
 export const DEMO_URL = 'https://stacklok.com/demo/'
-export const MCP_OPTIMIZER_SUNSET_BLOG_URL =
-  'https://stacklok.com/blog/mcp-optimizer-is-now-built-into-the-stacklok-platform/'
 
 // ── Registry ─────────────────────────────────────────────────────────────────
 
 export const DEFAULT_REGISTRY_JSON_URL =
   'https://raw.githubusercontent.com/stacklok/toolhive/refs/heads/main/pkg/registry/data/registry.json'
-export const MCP_OPTIMIZER_IMAGE = 'ghcr.io/stackloklabs/mcp-optimizer'
 
 // ── Privacy / legal ──────────────────────────────────────────────────────────
 
 
@@ -0,0 +1,173 @@
+import path from 'path'
+import {
+  _electron as electron,
+  type ElectronApplication,
+  type Page,
+} from '@playwright/test'
+
+/**
+ * Resolve the packaged ToolHive binary under `<repo>/out` for the platform
+ * and CPU architecture of the current Node process.
+ *
+ * Any platform other than `darwin` and `win32` is treated as Linux.
+ */
+function getExecutablePath(): string {
+  const { platform, arch } = process
+  const outDir = path.join(__dirname, '..', '..', 'out')
+  const bundleDir = (target: string): string =>
+    path.join(outDir, `ToolHive-${target}-${arch}`)
+
+  switch (platform) {
+    case 'darwin':
+      // macOS ships an .app bundle; the real binary sits inside it.
+      return path.join(
+        bundleDir('darwin'),
+        'ToolHive.app',
+        'Contents',
+        'MacOS',
+        'ToolHive'
+      )
+    case 'win32':
+      return path.join(bundleDir('win32'), 'ToolHive.exe')
+    default:
+      return path.join(bundleDir('linux'), 'ToolHive')
+  }
+}
+
+/** Handles returned by `launchApp` for one running instance of the app. */
+export interface LaunchedApp {
+  /** Playwright handle for the launched Electron application. */
+  app: ElectronApplication
+  /** The first window opened by the app. */
+  window: Page
+  /** Base URL (`http://127.0.0.1:<port>`) of the thv API reported by the app. */
+  baseUrl: string
+  /**
+   * Terminate the app without waiting on the renderer's before-quit teardown.
+   *
+   * On Linux CI the regular `ElectronApplication.close()` has been observed to
+   * hang indefinitely when a session has seeded a running workload via the thv
+   * API (the graceful shutdown path waits on a remote workload that never
+   * drains). We bypass that path via `app.exit(0)` and fall back to SIGKILL.
+   */
+  close: () => Promise<void>
+}
+
+/**
+ * Launch the Electron app bound to a specific userDataDir so the same
+ * directory can be reused across launches within a single test.
+ *
+ * Mirrors the setup in e2e-tests/fixtures/electron.ts but exposes the raw
+ * app/window instead of running the shared MCP server group bootstrap.
+ *
+ * Resolves once the "MCP Servers" link is visible and the thv API answers on
+ * the port reported by the app. If any step after the process has been
+ * spawned fails, the app is force-closed before the error is rethrown so a
+ * failed launch does not leave an orphaned Electron process behind.
+ *
+ * @param userDataDir - Directory passed to Electron via `--user-data-dir`.
+ * @returns Handles for the app, its first window, the thv base URL and a
+ *   force-close helper.
+ * @throws If the port cannot be resolved or the API never becomes ready.
+ */
+export async function launchApp(userDataDir: string): Promise<LaunchedApp> {
+  const app = await electron.launch({
+    executablePath: getExecutablePath(),
+    ...(process.env.CI ? { recordVideo: { dir: 'test-videos' } } : {}),
+    args: ['--no-sandbox', `--user-data-dir=${userDataDir}`],
+    env: {
+      ...process.env,
+      TOOLHIVE_E2E: 'true',
+    },
+  })
+
+  // Defined before any further setup so the failure path below can reuse it.
+  const close = async () => {
+    // Force an immediate exit via Electron's app.exit(), bypassing before-quit
+    // handlers, the confirmation dialog, and any pending graceful-shutdown
+    // work (e.g. waiting on seeded workloads to drain).
+    try {
+      await app.evaluate(({ app: electronApp }) => electronApp.exit(0))
+    } catch {
+      // Renderer/main may already be gone; ignore.
+    }
+
+    // Give the process a short window to exit cleanly, then hard-kill.
+    const proc = app.process()
+    await Promise.race([
+      app.close().catch(() => {}),
+      new Promise<void>((resolve) => setTimeout(resolve, 5_000)),
+    ])
+
+    if (proc.exitCode === null && !proc.killed) {
+      try {
+        proc.kill('SIGKILL')
+      } catch {
+        // Process may have exited between the check and the kill.
+      }
+    }
+  }
+
+  try {
+    const window = await app.firstWindow()
+
+    await window.route('https://*.sentry.io/**', (route) => {
+      throw new Error(`Sentry request blocked: ${route.request().url()}`)
+    })
+
+    // Disable quit confirmation dialog as a safety net; our close() helper
+    // also force-exits, so this mostly keeps manual tear-downs clean.
+    await window.evaluate(async () => {
+      // eslint-disable-next-line @typescript-eslint/no-explicit-any
+      await (globalThis as any).electronAPI.setSkipQuitConfirmation(true)
+    })
+
+    await window.getByRole('link', { name: /mcp servers/i }).waitFor()
+
+    const port = await window.evaluate(async () => {
+      // eslint-disable-next-line @typescript-eslint/no-explicit-any
+      return (await (globalThis as any).electronAPI.getToolhivePort()) as number
+    })
+
+    if (!port) {
+      throw new Error('Failed to resolve ToolHive port from the launched app')
+    }
+
+    const baseUrl = `http://127.0.0.1:${port}`
+
+    await waitForThvReady(baseUrl)
+
+    return { app, window, baseUrl, close }
+  } catch (error) {
+    // The caller never receives `close` when setup fails, so tear the process
+    // down here. Teardown problems must not mask the original failure.
+    await close().catch(() => {})
+    throw error
+  }
+}
+
+/**
+ * Thin wrapper around `fetch` for the thv HTTP API.
+ *
+ * Sends the request with a default `content-type: application/json` header
+ * (a caller-supplied content type wins) and returns the response status
+ * together with the parsed JSON body.
+ *
+ * @param baseUrl - Origin of the thv API, e.g. `http://127.0.0.1:1234`.
+ * @param apiPath - Path appended verbatim to `baseUrl`.
+ * @param init - Regular `fetch` options plus an optional `expectStatus`
+ *   allow-list of status codes.
+ * @returns The HTTP status and the parsed body; `json` is `null` when the
+ *   body is empty or is not valid JSON.
+ * @throws If `expectStatus` is given and the response status is not in it.
+ *   Without `expectStatus` no status is treated as a failure.
+ */
+export async function thvFetch<T = unknown>(
+  baseUrl: string,
+  apiPath: string,
+  init?: RequestInit & { expectStatus?: number[] }
+): Promise<{ status: number; json: T | null }> {
+  const { expectStatus, ...rest } = init ?? {}
+
+  // Normalize through `Headers` so every `HeadersInit` shape (plain object,
+  // tuple array, `Headers` instance) is honoured and header names are matched
+  // case-insensitively. Object spread would drop the latter two shapes and
+  // would duplicate the header for a caller-supplied `Content-Type`.
+  const headers = new Headers(rest.headers)
+  if (!headers.has('content-type')) {
+    headers.set('content-type', 'application/json')
+  }
+
+  const res = await fetch(`${baseUrl}${apiPath}`, { ...rest, headers })
+  const text = await res.text()
+
+  if (expectStatus && !expectStatus.includes(res.status)) {
+    throw new Error(
+      `thvFetch ${apiPath} expected status in [${expectStatus.join(',')}], got ${res.status}: ${text}`
+    )
+  }
+
+  let json: T | null = null
+  if (text) {
+    try {
+      json = JSON.parse(text) as T
+    } catch {
+      // Non-JSON bodies are reported as `null` rather than as an error.
+      json = null
+    }
+  }
+  return { status: res.status, json }
+}
+
+/**
+ * Poll `GET /api/v1beta/groups` until it answers with a 2xx status.
+ *
+ * Each probe is aborted once the overall deadline passes, so a request that
+ * stalls (connection accepted but never answered) cannot block past
+ * `timeoutMs`.
+ *
+ * @param baseUrl - Origin of the thv API.
+ * @param options - `timeoutMs` is the total time budget (default 30s).
+ * @throws If the API does not answer successfully within `timeoutMs`.
+ */
+async function waitForThvReady(
+  baseUrl: string,
+  { timeoutMs = 30_000 } = {}
+): Promise<void> {
+  const deadline = Date.now() + timeoutMs
+  while (Date.now() < deadline) {
+    const controller = new AbortController()
+    const abortTimer = setTimeout(
+      () => controller.abort(),
+      Math.max(0, deadline - Date.now())
+    )
+    try {
+      const res = await fetch(`${baseUrl}/api/v1beta/groups`, {
+        signal: controller.signal,
+      })
+      if (res.ok) return
+    } catch {
+      // Connection refused or probe aborted: keep polling.
+    } finally {
+      clearTimeout(abortTimer)
+    }
+    await new Promise((resolve) => setTimeout(resolve, 250))
+  }
+  throw new Error(
+    `ToolHive API at ${baseUrl} did not become ready within ${timeoutMs}ms`
+  )
+}
@@ -0,0 +1,186 @@
+import path from 'path'
+import fs from 'fs'
+import os from 'os'
+import { execSync } from 'child_process'
+import { test, expect } from '@playwright/test'
+import { launchApp, thvFetch, type LaunchedApp } from './helpers/app-relaunch'
+import {
+  startTestMcpServer,
+  type TestMcpServer,
+} from './helpers/test-mcp-server'
+
+// Group seeded in session 1 that the startup cleanup is expected to delete.
+const OPTIMIZER_GROUP = '__mcp-optimizer__'
+// Name of the remote workload seeded inside OPTIMIZER_GROUP.
+const META_MCP_SERVER = 'toolhive-mcp-optimizer'
+// User-created group that must survive cleanup and end up with TEST_CLIENT.
+const CUSTOM_GROUP = 'pw-optimizer-custom'
+// Client name registered against OPTIMIZER_GROUP during seeding.
+const TEST_CLIENT = 'vscode'
+
+/**
+ * Path of the thv CLI binary under `../bin/<platform>-<arch>/`, relative to
+ * this spec's directory, for the current Node process.
+ */
+function getThvPath(): string {
+  const targetDir = `${process.platform}-${process.arch}`
+  const executable = process.platform === 'win32' ? 'thv.exe' : 'thv'
+  return path.join(__dirname, '..', 'bin', targetDir, executable)
+}
+
+/**
+ * Remove the groups this spec creates (and their workloads) through the thv
+ * CLI, ignoring every failure. The CLI requires a Docker-compatible runtime
+ * but we already require that for e2e tests.
+ */
+function bestEffortCliCleanup(): void {
+  const cli = getThvPath()
+  const cliEnv = { ...process.env, TOOLHIVE_SKIP_DESKTOP_CHECK: 'true' }
+
+  const removeGroup = (name: string): void => {
+    try {
+      // Feed "y" on stdin to answer the CLI prompt; discard all output.
+      execSync(`"${cli}" group rm "${name}" --with-workloads`, {
+        input: 'y\n',
+        stdio: ['pipe', 'ignore', 'ignore'],
+        env: cliEnv,
+      })
+    } catch {
+      // Group does not exist - that's the happy path.
+    }
+  }
+
+  removeGroup(OPTIMIZER_GROUP)
+  removeGroup(CUSTOM_GROUP)
+}
+
+/**
+ * Create a group through the app's UI: open the "add a group" dialog, fill
+ * in the name, submit, and wait for the dialog to disappear.
+ */
+async function createGroupViaUi(
+  launched: LaunchedApp,
+  groupName: string
+): Promise<void> {
+  const page = launched.window
+  const dialog = page.getByRole('dialog')
+
+  await page.getByRole('button', { name: /add a group/i }).click()
+  await dialog.waitFor()
+
+  await page.getByLabel(/name/i).fill(groupName)
+  await page.getByRole('button', { name: /create/i }).click()
+
+  // The dialog closing is the signal that the submission went through.
+  await dialog.waitFor({ state: 'hidden' })
+}
+
+/**
+ * Seed the legacy MCP Optimizer state through the thv API: the optimizer
+ * group, a client registered against it, and a remote meta-mcp workload
+ * whose `ALLOWED_GROUPS` env var points at the custom group.
+ *
+ * The three requests run strictly in order; each throws if the response
+ * status is not one of the accepted codes.
+ */
+async function seedOptimizerState(
+  baseUrl: string,
+  testServer: TestMcpServer
+): Promise<void> {
+  const post = (apiPath: string, payload: unknown, expectStatus: number[]) =>
+    thvFetch(baseUrl, apiPath, {
+      method: 'POST',
+      body: JSON.stringify(payload),
+      expectStatus,
+    })
+
+  await post('/api/v1beta/groups', { name: OPTIMIZER_GROUP }, [200, 201])
+
+  await post(
+    '/api/v1beta/clients/register',
+    { names: [TEST_CLIENT], groups: [OPTIMIZER_GROUP] },
+    [200, 201]
+  )
+
+  // Create a remote meta-mcp workload so GET /workloads/meta-mcp later returns
+  // the ALLOWED_GROUPS env var that drives the restoration path. A remote
+  // workload avoids any Docker image pull complications.
+  await post(
+    '/api/v1beta/workloads',
+    {
+      name: META_MCP_SERVER,
+      group: OPTIMIZER_GROUP,
+      url: testServer.url,
+      transport: 'streamable-http',
+      env_vars: {
+        ALLOWED_GROUPS: CUSTOM_GROUP,
+      },
+    },
+    [200, 201, 202]
+  )
+}
+
+/**
+ * Poll the groups endpoint until the optimizer group has disappeared and the
+ * custom group lists the test client among its registered clients.
+ */
+async function waitForOptimizerCleanup(baseUrl: string): Promise<void> {
+  type GroupsResponse = {
+    groups?: Array<{ name?: string; registered_clients?: string[] }>
+  }
+
+  const readCleanupState = async () => {
+    const { json } = await thvFetch<GroupsResponse>(
+      baseUrl,
+      '/api/v1beta/groups',
+      { expectStatus: [200] }
+    )
+    const allGroups = json?.groups ?? []
+    const optimizer = allGroups.find((g) => g.name === OPTIMIZER_GROUP)
+    const custom = allGroups.find((g) => g.name === CUSTOM_GROUP)
+    const customHasClient =
+      custom?.registered_clients?.includes(TEST_CLIENT) ?? false
+    return { optimizerGone: !optimizer, customHasClient }
+  }
+
+  // App-side readiness wait can itself take up to TOOLHIVE_READY_MAX_WAIT_MS
+  // (60s). Give the poll a budget that exceeds that plus cleanup time so
+  // slow CI runners don't flake even though in practice this completes
+  // well under a second.
+  const pollOptions = { timeout: 120_000, intervals: [500, 1000, 2000] }
+
+  await expect
+    .poll(readCleanupState, pollOptions)
+    .toEqual({ optimizerGone: true, customHasClient: true })
+}
+
+// End-to-end check of the startup cleanup: session 1 seeds the legacy MCP
+// Optimizer state, session 2 relaunches on the same userDataDir and must
+// restore the client to the custom group and delete the optimizer group.
+test.describe('MCP Optimizer startup cleanup', () => {
+  let userDataDir: string
+  let testServer: TestMcpServer
+
+  test.beforeAll(async () => {
+    bestEffortCliCleanup()
+    testServer = await startTestMcpServer()
+  })
+
+  test.afterAll(async () => {
+    // Always run the CLI cleanup, even if stopping the test server fails, so
+    // seeded groups never leak past this spec.
+    try {
+      await testServer?.stop()
+    } finally {
+      bestEffortCliCleanup()
+    }
+  })
+
+  test.beforeEach(() => {
+    // Fresh profile per test; it is shared by both launches inside the test.
+    userDataDir = fs.mkdtempSync(
+      path.join(os.tmpdir(), 'toolhive-e2e-optimizer-cleanup-')
+    )
+  })
+
+  test.afterEach(() => {
+    fs.rmSync(userDataDir, { recursive: true, force: true })
+  })
+
+  test('restores clients to the custom group and deletes __mcp-optimizer__ on next launch', async () => {
+    // Session 1: seed the legacy MCP Optimizer state.
+    const firstLaunch = await launchApp(userDataDir)
+    try {
+      await createGroupViaUi(firstLaunch, CUSTOM_GROUP)
+      await seedOptimizerState(firstLaunch.baseUrl, testServer)
+
+      // Sanity: both groups exist and optimizer has the registered client.
+      const { json: seeded } = await thvFetch<{
+        groups?: Array<{ name?: string; registered_clients?: string[] }>
+      }>(firstLaunch.baseUrl, '/api/v1beta/groups', { expectStatus: [200] })
+      const seededOptimizer = seeded?.groups?.find(
+        (g) => g.name === OPTIMIZER_GROUP
+      )
+      expect(seededOptimizer?.registered_clients).toContain(TEST_CLIENT)
+      expect(seeded?.groups?.some((g) => g.name === CUSTOM_GROUP)).toBe(true)
+    } finally {
+      await firstLaunch.close()
+    }
+
+    // Session 2: relaunching with the same userDataDir should trigger the
+    // startup cleanup hook, which restores clients and deletes the group.
+    const secondLaunch = await launchApp(userDataDir)
+    try {
+      await waitForOptimizerCleanup(secondLaunch.baseUrl)
+
+      // The meta-mcp workload is deleted as part of ?with-workloads=true.
+      const { status: workloadStatus } = await thvFetch(
+        secondLaunch.baseUrl,
+        `/api/v1beta/workloads/${META_MCP_SERVER}`
+      )
+      expect(workloadStatus).toBe(404)
+
+      // The user's custom group is preserved.
+      const { json: finalGroups } = await thvFetch<{
+        groups?: Array<{ name?: string }>
+      }>(secondLaunch.baseUrl, '/api/v1beta/groups', { expectStatus: [200] })
+      expect(finalGroups?.groups?.some((g) => g.name === CUSTOM_GROUP)).toBe(
+        true
+      )
+    } finally {
+      await secondLaunch.close()
+    }
+  })
+})